accel_cores.c 6.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249
  1. // This file is Copyright (c) 2023 Victor Suarez Rovere <suarezvictor@gmail.com>
  2. // SPDX-License-Identifier: AGPL-3.0-only
  3. #include <stdio.h>
  4. #include <stdlib.h> //abs
  5. #include <string.h> //memcpy
  6. #include "misc.h" //just for ACCEL_STATIC_ASSERT
  7. #include "accel_cores.h"
  8. #include "graphics.h"
  9. #include "sw_cores.h"
  10. #include "bmp.h"
  11. //#define INDUCE_RENDERING_ERRORS //enable to induce errors in softwre renderer
  12. unsigned accel_rectangle_fill(accel_rectangle_fill32_layout_t *regs, int x0, int y0, int x1, int y1, uint32_t rgba)
  13. {
  14. accel_rectangle_fill32_layout_t sw_args;
  15. int sw_render = !regs;
  16. uintptr_t fb_base = VIDEO_FRAMEBUFFER_BASE;
  17. #ifdef VRAM_ORIGIN_ACCEL_RECTANGLE_FILL32
  18. if(!sw_render) fb_base = VRAM_ORIGIN_ACCEL_RECTANGLE_FILL32;
  19. #endif
  20. if(sw_render)
  21. regs = &sw_args;
  22. else
  23. {
  24. regs->run = 0; //stps
  25. while(regs->done); //wait data latch
  26. }
  27. fb_base += (y0<y1?y0:y1)*FRAME_PITCH + (x0<x1?x0:x1)*sizeof(rgba);
  28. regs->x0 = x0 < x1 ? x0 : x1;
  29. regs->x1 = 1 + (x1 > x0 ? x1 : x0);
  30. regs->y0 = y0 < y1 ? y0 : y1;
  31. regs->y1 = 1 + (y1 > y0 ? y1 : y0);
  32. regs->base = fb_base;
  33. regs->xstride = SDRAM_BUS_BITS/8;
  34. regs->ystride = FRAME_PITCH;
  35. regs->rgba = rgba;
  36. if(sw_render)
  37. {
  38. //printf("sw_rectangle_fill\n");
  39. sw_rectangle_fill(regs);
  40. }
  41. else
  42. {
  43. regs->run = 1; //start
  44. while(!regs->done); //wait until done
  45. }
  46. return (abs(x1-x0)+1)*(abs(y1-y0)+1);
  47. }
  48. unsigned accel_ellipse_fill(accel_ellipse_fill32_layout_t *regs, int x0, int y0, int x1, int y1, uint32_t rgba)
  49. {
  50. accel_ellipse_fill32_layout_t sw_args;
  51. int sw_render = !regs;
  52. uintptr_t fb_base = VIDEO_FRAMEBUFFER_BASE;
  53. #ifdef VRAM_ORIGIN_ACCEL_ELLIPSE_FILL32
  54. if(!sw_render) fb_base = VRAM_ORIGIN_ACCEL_ELLIPSE_FILL32;
  55. #endif
  56. if(sw_render)
  57. regs = &sw_args;
  58. else
  59. {
  60. regs->run = 0; //stops
  61. while(regs->done); //wait data latch
  62. }
  63. fb_base += (y0<y1?y0:y1)*FRAME_PITCH + (x0<x1?x0:x1)*sizeof(rgba);
  64. regs->x0 = x0 < x1 ? x0 : x1;
  65. regs->x1 = 1 + (x1 > x0 ? x1 : x0);
  66. regs->y0 = y0 < y1 ? y0 : y1;
  67. regs->y1 = 1 + (y1 > y0 ? y1 : y0);
  68. regs->base = fb_base;
  69. regs->xstride = SDRAM_BUS_BITS/8;
  70. regs->ystride = FRAME_PITCH;
  71. regs->rgba = rgba;
  72. if(sw_render)
  73. {
  74. //printf("sw_ellipse_fill\n");
  75. #ifdef INDUCE_RENDERING_ERRORS
  76. ++regs->y1;
  77. #endif
  78. sw_ellipse_fill(regs);
  79. }
  80. else
  81. {
  82. regs->run = 1; //start
  83. while(!regs->done); //wait until done
  84. }
  85. return (abs(x1-x0)+1)*(abs(y1-y0)+1);
  86. }
  87. unsigned accel_line(accel_line32_layout_t *regs, int x0, int y0, int x1, int y1, uint32_t rgba)
  88. {
  89. accel_line32_layout_t sw_args;
  90. int sw_render = !regs;
  91. uintptr_t fb_base = VIDEO_FRAMEBUFFER_BASE;
  92. #ifdef VRAM_ORIGIN_ACCEL_ELLIPSE_FILL32
  93. if(!sw_render) fb_base = VRAM_ORIGIN_ACCEL_ELLIPSE_FILL32;
  94. #endif
  95. if(sw_render)
  96. regs = &sw_args;
  97. else
  98. {
  99. regs->run = 0; //stops
  100. while(regs->done); //wait data latch
  101. }
  102. fb_base += y0*FRAME_PITCH + x0*sizeof(rgba);
  103. regs->x0 = x0;
  104. regs->x1 = x1;
  105. regs->y0 = y0;
  106. regs->y1 = y1;
  107. regs->base = fb_base;
  108. regs->xstride = x0 < x1 ? SDRAM_BUS_BITS/8 : -SDRAM_BUS_BITS/8;
  109. regs->ystride = y0 < y1 ? FRAME_PITCH : -FRAME_PITCH;
  110. regs->rgba = rgba;
  111. if(sw_render)
  112. {
  113. //printf("sw_line\n");
  114. #ifdef INDUCE_RENDERING_ERRORS
  115. ++regs->y1;
  116. #endif
  117. sw_line(regs);
  118. }
  119. else
  120. {
  121. regs->run = 1; //start
  122. while(!regs->done); //wait until done
  123. }
  124. return abs(x1-x0)+abs(y1-y0);
  125. }
  126. unsigned accel_rectangle(accel_line32_layout_t *regs, int x0, int y0, int x1, int y1, uint32_t rgba)
  127. {
  128. return accel_line(regs, x0, y0, x1, y0, rgba)
  129. + accel_line(regs, x1, y0, x1, y1, rgba)
  130. + accel_line(regs, x1, y1, x0, y1, rgba)
  131. + accel_line(regs, x0, y1, x0, y0, rgba);
  132. }
  133. //example command for PNG to BMP (32-bit)
  134. //$ convert input.png -alpha on output.bmp
  135. void accel_bmp_decode(const void *coded_buf, size_t coded_len, void *dst, unsigned writer_stride,
  136. unsigned *decoded_width, unsigned *decoded_height, int wait_done)
  137. {
  138. BMPHeader *bmp = (BMPHeader *) coded_buf;
  139. assert(bmp->type == 0x4D42);
  140. assert(bmp->bits_per_pixel == 32 && bmp->compression == 3); //check RGBA32 format
  141. unsigned w = bmp->width_px, h = bmp->height_px;
  142. uint32_t *data = ((uint8_t*)bmp) + bmp->offset;
  143. uint8_t *fb = (uint8_t *) dst;
  144. fb += h * writer_stride;
  145. while(h--)
  146. {
  147. fb -= writer_stride;
  148. memcpy(fb, data, w*sizeof(uint32_t));
  149. data += w;
  150. }
  151. if(decoded_width) *decoded_width = w;
  152. if(decoded_height) *decoded_height = h;
  153. }
  154. #ifdef CSR_JPEG_DECODER_BASE
  155. /*
  156. Example converting a video file
  157. wget http://download.blender.org/peach/bigbuckbunny_movies/big_buck_bunny_480p_surround-fix.avi
  158. ffmpeg -i big_buck_bunny_480p_surround-fix.avi -vf "scale=640:480" frame%05d.png
  159. (for file in frame*.png; do convert "$file" ppm:- | cjpeg -quality 90 -sample 2x2 -baseline -outfile "${file%.png}.jpeg"; echo "${file%.png}.jpeg"; done;) | tar -T - -cvf big_buck_bunny_480p_surround-fix.jpeg.tar
  160. rm frame*.png frame*.jpeg
  161. At same resolution, resulting size is about 4X the original file (no audio)
  162. */
  163. void accel_jpeg_decode(const void *coded_buf, size_t coded_len, void *dst, unsigned writer_stride,
  164. unsigned *decoded_width, unsigned *decoded_height, int wait_done)
  165. {
  166. accel_jpeg_decode_waitdone(NULL, NULL);
  167. coded_len = (coded_len + 3) & ~3;
  168. jpeg_decoder_reader_base_write((intptr_t) coded_buf);
  169. jpeg_decoder_reader_length_write(coded_len);
  170. jpeg_decoder_writer_base_write((intptr_t) dst);
  171. jpeg_decoder_writer_stride_write(writer_stride);
  172. jpeg_decoder_reader_enable_write(1); //start decoding
  173. if(wait_done)
  174. accel_jpeg_decode_waitdone(decoded_width, decoded_height);
  175. }
  176. void accel_jpeg_decode_waitdone(unsigned *decoded_width, unsigned *decoded_height)
  177. {
  178. int count = 0;
  179. while(!jpeg_decoder_idle_status_read())
  180. {
  181. if(count++>100)
  182. {
  183. jpeg_decoder_reader_enable_write(0);
  184. printf("DECODING ERROR\n");
  185. return;
  186. }
  187. printf("idle %ld, byte read offset %ld (of %d), write offset %ld (%d,%d)\n", jpeg_decoder_idle_status_read(),
  188. jpeg_decoder_reader_offset_read()*4, jpeg_decoder_reader_length_read(),
  189. jpeg_decoder_outport_pixel_offset_read(), jpeg_decoder_outport_x_read(), jpeg_decoder_outport_y_read());
  190. }
  191. /*
  192. if(decoded_width && decoded_height)
  193. {
  194. printf("FINAL idle %ld, byte read offset %ld, write offset %ld (%d,%d)\n", jpeg_decoder_idle_status_read(),
  195. jpeg_decoder_reader_offset_read()*4, jpeg_decoder_outport_pixel_offset_read()*4,
  196. jpeg_decoder_outport_x_read(), jpeg_decoder_outport_y_read());
  197. }
  198. */
  199. if(decoded_width)
  200. *decoded_width = jpeg_decoder_outport_width_read();
  201. if(decoded_height)
  202. *decoded_height = jpeg_decoder_outport_height_read();
  203. jpeg_decoder_reader_enable_write(0);
  204. //jpeg_decoder_reader_enable_write(0);
  205. //printf("RESET size (%d,%d)\n", jpeg_decoder_outport_width_read(), jpeg_decoder_outport_height_read());
  206. }
  207. #else
  208. #warning implement software JPEG decoder
  209. #endif