removed clang-format and clang_complete files from the repo
[dosdemo] / src / dos / gfx.c
1 #include <stdio.h>
2 #include <stdlib.h>
3 #include <string.h>
4 #include <dos.h>
5 #include "demo.h"
6 #include "cdpmi.h"
7 #include "gfx.h"
8 #include "vbe.h"
9 #include "vga.h"
10 #include "util.h"
11 #include "cpuid.h"
12
/* Pointer to the start of the legacy video memory window at 0xa0000.
 * DJGPP builds have to offset it by __djgpp_conventional_base.
 */
#ifndef __DJGPP__
#define VMEM_PTR	((void*)0xa0000)
#else
#define VMEM_PTR	((void*)(0xa0000 + __djgpp_conventional_base))
#endif

/* Non-zero when two color depths are treated as interchangeable: identical
 * values, 15 and 16 bpp, or 24 and 32 bpp. Arguments are evaluated more than
 * once.
 */
#define SAME_BPP(a, b)	\
	((a) == (b) || \
	 ((a) == 16 && (b) == 15) || ((a) == 15 && (b) == 16) || \
	 ((a) == 32 && (b) == 24) || ((a) == 24 && (b) == 32))
22
23 void (*blit_frame)(void*, int);
24
25 static void blit_frame_lfb(void *pixels, int vsync);
26 static void blit_frame_banked(void *pixels, int vsync);
27 static uint32_t calc_mask(int sz, int pos);
28
29 static void enable_wrcomb(uint32_t addr, int len);
30 static const char *mtrr_type_name(int type);
31 static void print_mtrr(void);
32
33 static struct video_mode *vmodes;
34 static int num_vmodes;
35
36 static int vbe_init_ver;
37 static struct vbe_info vbe;
38
39 /* current mode */
40 static struct video_mode *curmode;
41 static void *vpgaddr[2];
42 static int frontidx, backidx;
43 static int pgcount, pgsize, fbsize;
44
45
46 int init_video(void)
47 {
48         int i, num, max_modes;
49         struct video_mode *vmptr;
50
51         if(vbe_info(&vbe) == -1) {
52                 fprintf(stderr, "failed to retrieve VBE information\n");
53                 return -1;
54         }
55         vbe_print_info(stdout, &vbe);
56
57         num_vmodes = 0;
58         max_modes = 64;
59         if(!(vmodes = malloc(max_modes * sizeof *vmodes))) {
60                 fprintf(stderr, "failed to allocate video modes list\n");
61                 return -1;
62         }
63
64         num = vbe_num_modes(&vbe);
65         for(i=0; i<num; i++) {
66                 struct vbe_mode_info minf;
67
68                 if(vbe_mode_info(vbe.modes[i], &minf) == -1) {
69                         continue;
70                 }
71
72                 if(num_vmodes >= max_modes) {
73                         int newmax = max_modes ? (max_modes << 1) : 16;
74                         if(!(vmptr = realloc(vmodes, newmax * sizeof *vmodes))) {
75                                 fprintf(stderr, "failed to grow video mode list (%d)\n", newmax);
76                                 free(vmodes);
77                                 return -1;
78                         }
79                         vmodes = vmptr;
80                         max_modes = newmax;
81                 }
82
83                 vmptr = vmodes + num_vmodes++;
84                 memset(vmptr, 0, sizeof *vmptr);
85                 vmptr->mode = vbe.modes[i];
86                 vmptr->xsz = minf.xres;
87                 vmptr->ysz = minf.yres;
88                 vmptr->bpp = minf.bpp;
89                 vmptr->pitch = minf.scanline_bytes;
90                 if(minf.mem_model == VBE_TYPE_DIRECT) {
91                         vmptr->rbits = minf.rsize;
92                         vmptr->gbits = minf.gsize;
93                         vmptr->bbits = minf.bsize;
94                         vmptr->rshift = minf.rpos;
95                         vmptr->gshift = minf.gpos;
96                         vmptr->bshift = minf.bpos;
97                         vmptr->rmask = calc_mask(minf.rsize, minf.rpos);
98                         vmptr->gmask = calc_mask(minf.gsize, minf.gpos);
99                         vmptr->bmask = calc_mask(minf.bsize, minf.bpos);
100                         /*vmptr->bpp = vmptr->rbits + vmptr->gbits + vmptr->bbits;*/
101                 }
102                 if(minf.attr & VBE_ATTR_LFB) {
103                         vmptr->fb_addr = minf.fb_addr;
104                 }
105                 vmptr->max_pages = minf.num_img_pages;
106                 vmptr->win_gran = minf.win_gran;
107
108                 printf("%04x: ", vbe.modes[i]);
109                 vbe_print_mode_info(stdout, &minf);
110         }
111         fflush(stdout);
112
113         vbe_init_ver = VBE_VER_MAJOR(vbe.ver);
114         return 0;
115 }
116
117 void cleanup_video(void)
118 {
119         free(vmodes);
120 }
121
122 struct video_mode *video_modes(void)
123 {
124         return vmodes;
125 }
126
127 int num_video_modes(void)
128 {
129         return num_vmodes;
130 }
131
132 struct video_mode *get_video_mode(int idx)
133 {
134         if(idx == VMODE_CURRENT) {
135                 return curmode;
136         }
137         return vmodes + idx;
138 }
139
140 int match_video_mode(int xsz, int ysz, int bpp)
141 {
142         int i, best = -1;
143         struct video_mode *vm;
144
145         for(i=0; i<num_vmodes; i++) {
146                 vm = vmodes + i;
147                 if(vm->xsz != xsz || vm->ysz != ysz) continue;
148                 if(SAME_BPP(vm->bpp, bpp)) {
149                         best = i;
150                 }
151                 if(vm->bpp == bpp) break;
152         }
153
154         if(best == -1) {
155                 fprintf(stderr, "failed to find video mode %dx%d %d bpp)\n", xsz, ysz, bpp);
156                 return -1;
157         }
158         return best;
159 }
160
161 int find_video_mode(int mode)
162 {
163         int i;
164         struct video_mode *vm;
165
166         vm = vmodes;
167         for(i=0; i<num_vmodes; i++) {
168                 if(vm->mode == mode) return i;
169         }
170         return -1;
171 }
172
173 void *set_video_mode(int idx, int nbuf)
174 {
175         unsigned int mode;
176         struct video_mode *vm = vmodes + idx;
177
178         if(curmode == vm) return vpgaddr[0];
179
180         printf("setting video mode %x (%dx%d %d bpp)\n", (unsigned int)vm->mode,
181                         vm->xsz, vm->ysz, vm->bpp);
182         fflush(stdout);
183
184         mode = vm->mode | VBE_MODE_LFB;
185         if(vbe_setmode(mode) == -1) {
186                 mode = vm->mode;
187                 if(vbe_setmode(mode) == -1) {
188                         fprintf(stderr, "failed to set video mode %x\n", (unsigned int)vm->mode);
189                         return 0;
190                 }
191                 printf("Warning: failed to get a linear framebuffer. falling back to banked mode\n");
192         }
193
194         /* unmap previous video memory mapping, if there was one (switching modes) */
195         if(vpgaddr[0] && vpgaddr[0] != VMEM_PTR) {
196                 dpmi_munmap(vpgaddr[0]);
197                 vpgaddr[0] = vpgaddr[1] = 0;
198         }
199
200         curmode = vm;
201         if(nbuf < 1) nbuf = 1;
202         if(nbuf > 2) nbuf = 2;
203         pgcount = nbuf > vm->max_pages + 1 ? vm->max_pages + 1 : nbuf;
204         pgsize = vm->ysz * vm->pitch;
205         fbsize = pgcount * pgsize;
206
207         if(vm->bpp > 8) {
208                 printf("rgb mask: %x %x %x\n", (unsigned int)vm->rmask,
209                                 (unsigned int)vm->gmask, (unsigned int)vm->bmask);
210                 printf("rgb shift: %d %d %d\n", vm->rshift, vm->gshift, vm->bshift);
211         }
212         printf("pgcount: %d, pgsize: %d, fbsize: %d\n", pgcount, pgsize, fbsize);
213         if(vm->fb_addr) {
214                 printf("phys addr: %p\n", (void*)vm->fb_addr);
215         }
216         fflush(stdout);
217
218         if(vm->fb_addr) {
219                 vpgaddr[0] = (void*)dpmi_mmap(vm->fb_addr, fbsize);
220                 if(!vpgaddr[0]) {
221                         fprintf(stderr, "failed to map framebuffer (phys: %lx, size: %d)\n",
222                                         (unsigned long)vm->fb_addr, fbsize);
223                         set_text_mode();
224                         return 0;
225                 }
226                 memset(vpgaddr[0], 0xaa, pgsize);
227
228                 if(pgcount > 1) {
229                         vpgaddr[1] = (char*)vpgaddr[0] + pgsize;
230                         backidx = 1;
231                         page_flip(FLIP_NOW);    /* start with the second page visible */
232                 } else {
233                         frontidx = backidx = 0;
234                         vpgaddr[1] = 0;
235                 }
236
237                 blit_frame = blit_frame_lfb;
238
239                 /* only attempt to set up write combining if the CPU we're running on
240                  * supports memory type range registers, and we're running on ring 0
241                  */
242                 if(CPU_HAVE_MTRR) {
243                         int cpl = get_cpl();
244                         if(cpl > 0) {
245                                 fprintf(stderr, "Can't set framebuffer range to write-combining, running in ring %d\n", cpl);
246                         } else {
247                                 uint32_t len = (uint32_t)vbe.vmem_blk << 16;
248
249                                 /* if vmem_blk is 0 or if the reported size is absurd (more than
250                                  * 256mb), just use the framebuffer size for this mode to setup the
251                                  * mtrr
252                                  */
253                                 if(!len || len > 0x10000000) {
254                                         printf("reported vmem too large or overflowed, using fbsize for wrcomb setup\n");
255                                         len = fbsize;
256                                 }
257                                 print_mtrr();
258                                 enable_wrcomb(vm->fb_addr, len);
259                         }
260                 }
261
262         } else {
263                 vpgaddr[0] = VMEM_PTR;
264                 vpgaddr[1] = 0;
265
266                 blit_frame = blit_frame_banked;
267
268                 /* calculate window granularity shift */
269                 vm->win_gran_shift = 0;
270                 vm->win_64k_step = 1;
271                 if(vm->win_gran > 0 && vm->win_gran < 64) {
272                         int gran = vm->win_gran;
273                         while(gran < 64) {
274                                 vm->win_gran_shift++;
275                                 gran <<= 1;
276                         }
277                         vm->win_64k_step = 1 << vm->win_gran_shift;
278                 }
279
280                 printf("granularity: %dk (step: %d)\n", vm->win_gran, vm->win_64k_step);
281         }
282
283         /* allocate main memory framebuffer */
284         if(demo_resizefb(vm->xsz, vm->ysz, vm->bpp) == -1) {
285                 fprintf(stderr, "failed to allocate %dx%d (%d bpp) framebuffer\n", vm->xsz,
286                                 vm->ysz, vm->bpp);
287                 set_text_mode();
288                 return 0;
289         }
290
291         fflush(stdout);
292         return vpgaddr[0];
293 }
294
295 int set_text_mode(void)
296 {
297         /* unmap previous video memory mapping, if there was one (switching modes) */
298         if(vpgaddr[0] && vpgaddr[0] != VMEM_PTR) {
299                 dpmi_munmap(vpgaddr[0]);
300                 vpgaddr[0] = vpgaddr[1] = 0;
301         }
302
303         vga_setmode(3);
304         curmode = 0;
305         return 0;
306 }
307
308 void *page_flip(int vsync)
309 {
310         if(!vpgaddr[1]) {
311                 /* page flipping not supported */
312                 return vpgaddr[0];
313         }
314
315         vbe_swap(backidx ? pgsize : 0, vsync ? VBE_SWAP_VBLANK : VBE_SWAP_NOW);
316         frontidx = backidx;
317         backidx = (backidx + 1) & 1;
318
319         return vpgaddr[backidx];
320 }
321
322
323 static void blit_frame_lfb(void *pixels, int vsync)
324 {
325         demo_post_draw(pixels);
326
327         if(vsync) wait_vsync();
328         memcpy64(vpgaddr[frontidx], pixels, pgsize >> 3);
329 }
330
331 static void blit_frame_banked(void *pixels, int vsync)
332 {
333         int sz, offs, pending;
334         unsigned char *pptr = pixels;
335
336         demo_post_draw(pixels);
337
338         if(vsync) wait_vsync();
339
340         /* assume initial window offset at 0 */
341         offs = 0;
342         pending = pgsize;
343         while(pending > 0) {
344                 sz = pending > 65536 ? 65536 : pending;
345                 /*memcpy64(VMEM_PTR, pptr, sz >> 3);*/
346                 memcpy(VMEM_PTR, pptr, sz);
347                 pptr += sz;
348                 pending -= sz;
349                 offs += curmode->win_64k_step;
350                 vbe_setwin(0, offs);
351         }
352         vbe_setwin(0, 0);
353 }
354
/* Builds a 32bit mask with sz consecutive bits set, the lowest of which is at
 * bit position pos. Bits which end up above bit 31 are discarded.
 *
 * A non-positive sz yields 0. A position outside 0..31 also yields 0, instead
 * of performing an out of range shift, which is undefined behavior in C.
 */
static uint32_t calc_mask(int sz, int pos)
{
	uint32_t mask = 0;

	if(pos < 0 || pos >= 32) {
		return 0;
	}

	while(sz-- > 0) {
		mask = (mask << 1) | 1;
	}
	return mask << pos;
}
363
/* model specific register numbers used for the MTRR setup */
#define MSR_MTRRCAP		0xfe
#define MSR_MTRRDEFTYPE		0x2ff
/* base/mask register pair of variable range x */
#define MSR_MTRRBASE(x)		(0x200 | ((x) << 1))
#define MSR_MTRRMASK(x)		(0x201 | ((x) << 1))

/* flag bits tested/set in the low word of the above registers */
#define MTRRDEF_EN		(1 << 11)
#define MTRRCAP_HAVE_WC		(1 << 10)
#define MTRRMASK_VALID		(1 << 11)

/* memory type value for write-combining */
#define MTRR_WC			1
373
374 static int get_page_memtype(uint32_t addr, int num_ranges)
375 {
376         int i;
377         uint32_t rlow, rhigh;
378         uint32_t base, mask;
379
380         for(i=0; i<num_ranges; i++) {
381                 get_msr(MSR_MTRRMASK(i), &rlow, &rhigh);
382                 if(!(rlow & MTRRMASK_VALID)) {
383                         continue;
384                 }
385                 mask = rlow & 0xfffff000;
386
387                 get_msr(MSR_MTRRBASE(i), &rlow, &rhigh);
388                 base = rlow & 0xfffff000;
389
390                 if((addr & mask) == (base & mask)) {
391                         return rlow & 0xff;
392                 }
393         }
394
395         get_msr(MSR_MTRRDEFTYPE, &rlow, &rhigh);
396         return rlow & 0xff;
397 }
398
399 static int check_wrcomb_enabled(uint32_t addr, int len, int num_ranges)
400 {
401         while(len > 0) {
402                 if(get_page_memtype(addr, num_ranges) != MTRR_WC) {
403                         return 0;
404                 }
405                 addr += 4096;
406                 len -= 4096;
407         }
408         return 1;
409 }
410
411 static int alloc_mtrr(int num_ranges)
412 {
413         int i;
414         uint32_t rlow, rhigh;
415
416         for(i=0; i<num_ranges; i++) {
417                 get_msr(MSR_MTRRMASK(i), &rlow, &rhigh);
418                 if(!(rlow & MTRRMASK_VALID)) {
419                         return i;
420                 }
421         }
422         return -1;
423 }
424
425 static void enable_wrcomb(uint32_t addr, int len)
426 {
427         int num_ranges, mtrr;
428         uint32_t rlow, rhigh;
429         uint32_t def, mask;
430
431         if(len <= 0 || (addr | (uint32_t)len) & 0xfff) {
432                 fprintf(stderr, "failed to enable write combining, unaligned range: %p/%x\n",
433                                 (void*)addr, (unsigned int)len);
434                 return;
435         }
436
437         get_msr(MSR_MTRRCAP, &rlow, &rhigh);
438         num_ranges = rlow & 0xff;
439
440         printf("enable_wrcomb: addr=%p len=%x\n", (void*)addr, (unsigned int)len);
441
442         if(!(rlow & MTRRCAP_HAVE_WC)) {
443                 fprintf(stderr, "failed to enable write combining, processor doesn't support it\n");
444                 return;
445         }
446
447         if(check_wrcomb_enabled(addr, len, num_ranges)) {
448                 return;
449         }
450
451         if((mtrr = alloc_mtrr(num_ranges)) == -1) {
452                 fprintf(stderr, "failed to enable write combining, no free MTRRs\n");
453                 return;
454         }
455
456         mask = len - 1;
457         mask |= mask >> 1;
458         mask |= mask >> 2;
459         mask |= mask >> 4;
460         mask |= mask >> 8;
461         mask |= mask >> 16;
462         mask = ~mask & 0xfffff000;
463
464         printf("  ... mask: %08x\n", (unsigned int)mask);
465
466         _disable();
467         get_msr(MSR_MTRRDEFTYPE, &def, &rhigh);
468         set_msr(MSR_MTRRDEFTYPE, def & ~MTRRDEF_EN, rhigh);
469
470         set_msr(MSR_MTRRBASE(mtrr), addr | MTRR_WC, 0);
471         set_msr(MSR_MTRRMASK(mtrr), mask | MTRRMASK_VALID, 0);
472
473         set_msr(MSR_MTRRDEFTYPE, def | MTRRDEF_EN, 0);
474         _enable();
475 }
476
/* Names of the MTRR memory types, indexed by type value: 0 uncacheable,
 * 1 write-combining, 4 write-through, 5 write-protected, 6 write-back.
 * Values 2 and 3 are not assigned to any memory type.
 */
static const char *mtrr_names[] = { "U C", "W C", "N/A", "N/A", "W T", "W P", "W B" };

/* Returns a short printable name for an MTRR memory type value, or "N/A" for
 * values which don't correspond to a memory type.
 */
static const char *mtrr_type_name(int type)
{
	if(type < 0 || (unsigned int)type >= sizeof mtrr_names / sizeof *mtrr_names) {
		return "N/A";
	}
	return mtrr_names[type];
}
486
487 static void print_mtrr(void)
488 {
489         int i, num_ranges;
490         uint32_t rlow, rhigh, base, mask;
491
492         get_msr(MSR_MTRRCAP, &rlow, &rhigh);
493         num_ranges = rlow & 0xff;
494
495         for(i=0; i<num_ranges; i++) {
496                 get_msr(MSR_MTRRBASE(i), &base, &rhigh);
497                 get_msr(MSR_MTRRMASK(i), &mask, &rhigh);
498
499                 if(mask & MTRRMASK_VALID) {
500                         printf("mtrr%d: base %p, mask %08x type %s\n", i, (void*)(base & 0xfffff000),
501                                         (unsigned int)(mask & 0xfffff000), mtrr_type_name(base & 0xff));
502                 } else {
503                         printf("mtrr%d unused (%08x/%08x)\n", i, (unsigned int)base,
504                                         (unsigned int)mask);
505                 }
506         }
507         fflush(stdout);
508 }