check alloc
[dos_imgv] / src / video.c
1 #include <stdlib.h>
2 #include <string.h>
3 #include <dos.h>
4 #include "cdpmi.h"
5 #include "video.h"
6 #include "vbe.h"
7 #include "vga.h"
8 #include "util.h"
9 #include "chkalloc.h"
10
11 #ifdef __WATCOMC__
12 #include <i86.h>
13 #define enable  _enable
14 #define disable _disable
15 #endif
16
/* VMEM_PTR: pointer through which the 64k video memory window at 0xa0000 is
 * accessed (used by the banked blit path and as the page address in banked
 * modes).
 */
#ifdef __DJGPP__
/* under DJGPP the address is offset by __djgpp_conventional_base */
#define VMEM_PTR        ((void*)(0xa0000 + __djgpp_conventional_base))
#else
/* otherwise 0xa0000 is used as a pointer value directly */
#define VMEM_PTR        ((void*)0xa0000)
#endif

/* SAME_BPP(a, b): non-zero if the two color depths are equal, or if they form
 * one of the pairs 15/16 or 24/32 (in either order). Both arguments are
 * evaluated more than once, so they must be free of side effects.
 */
#define SAME_BPP(a, b)  \
        ((a) == (b) || ((a) == 16 && (b) == 15) || ((a) == 15 && (b) == 16) || \
         ((a) == 32 && (b) == 24) || ((a) == 24 && (b) == 32))
26
/* Frame blit entry point: takes the pixel buffer and a vsync flag.
 * set_video_mode points it at blit_frame_lfb or blit_frame_banked.
 */
void (*blit_frame)(void*, int);

/* declared here, but neither defined nor called in this part of the file */
int resizefb(int x, int y, int bpp, int pitch);

/* the two blit_frame implementations and the channel mask helper */
static void blit_frame_lfb(void *pixels, int vsync);
static void blit_frame_banked(void *pixels, int vsync);
static uint32_t calc_mask(int sz, int pos);

/* MTRR / write-combining helpers */
static void enable_wrcomb(uint32_t addr, int len);
static const char *mtrr_type_name(int type);
static void print_mtrr(void);

/* list of video modes filled in by init_video, and its element count */
static struct video_mode *vmodes;
static int num_vmodes;

/* VBE major version and VBE information block, both set by init_video */
static int vbe_init_ver;
static struct vbe_info vbe;

/* current mode */
static struct video_mode *curmode;      /* 0 when no graphics mode is set */
static void *vpgaddr[2];                /* page addresses; [1] is 0 when page flipping is unavailable */
static int frontidx, backidx;           /* indices into vpgaddr, updated by page_flip */
static int pgcount, pgsize, fbsize;     /* pgsize = ysz * pitch, fbsize = pgcount * pgsize */
50
51
52 int init_video(void)
53 {
54         int i, num, max_modes;
55         struct video_mode *vmptr;
56
57         if(vbe_info(&vbe) == -1) {
58                 fprintf(stderr, "failed to retrieve VBE information\n");
59                 return -1;
60         }
61         vbe_print_info(stdout, &vbe);
62
63         num_vmodes = 0;
64         max_modes = 256;
65         if(!(vmodes = chk_malloc(max_modes * sizeof *vmodes))) {
66                 fprintf(stderr, "failed to allocate video modes list\n");
67                 return -1;
68         }
69
70         num = vbe_num_modes(&vbe);
71         for(i=0; i<num; i++) {
72                 struct vbe_mode_info minf;
73
74                 if(vbe_mode_info(vbe.modes[i], &minf) == -1) {
75                         continue;
76                 }
77
78                 if(num_vmodes >= max_modes) {
79                         int newmax = max_modes ? (max_modes << 1) : 16;
80                         if(!(vmptr = chk_realloc(vmodes, newmax * sizeof *vmodes))) {
81                                 fprintf(stderr, "failed to grow video mode list (%d)\n", newmax);
82                                 chk_free(vmodes);
83                                 return -1;
84                         }
85                         vmodes = vmptr;
86                         max_modes = newmax;
87                 }
88
89                 vmptr = vmodes + num_vmodes++;
90                 memset(vmptr, 0, sizeof *vmptr);
91                 vmptr->mode = vbe.modes[i];
92                 vmptr->xsz = minf.xres;
93                 vmptr->ysz = minf.yres;
94                 vmptr->bpp = minf.bpp;
95                 vmptr->pitch = minf.scanline_bytes;
96                 if(minf.mem_model == VBE_TYPE_DIRECT) {
97                         vmptr->rbits = minf.rsize;
98                         vmptr->gbits = minf.gsize;
99                         vmptr->bbits = minf.bsize;
100                         vmptr->rshift = minf.rpos;
101                         vmptr->gshift = minf.gpos;
102                         vmptr->bshift = minf.bpos;
103                         vmptr->rmask = calc_mask(minf.rsize, minf.rpos);
104                         vmptr->gmask = calc_mask(minf.gsize, minf.gpos);
105                         vmptr->bmask = calc_mask(minf.bsize, minf.bpos);
106                         /*vmptr->bpp = vmptr->rbits + vmptr->gbits + vmptr->bbits;*/
107                 }
108 #ifndef DBG_NOLFB
109                 if(minf.attr & VBE_ATTR_LFB) {
110                         vmptr->fb_addr = minf.fb_addr;
111                 }
112 #endif
113                 vmptr->max_pages = minf.num_img_pages;
114                 vmptr->win_gran = minf.win_gran;
115
116                 printf("%04x: ", vbe.modes[i]);
117                 vbe_print_mode_info(stdout, &minf);
118         }
119         fflush(stdout);
120
121         vbe_init_ver = VBE_VER_MAJOR(vbe.ver);
122         return 0;
123 }
124
125 void cleanup_video(void)
126 {
127         chk_free(vmodes);
128 }
129
130 struct video_mode *video_modes(void)
131 {
132         return vmodes;
133 }
134
135 int num_video_modes(void)
136 {
137         return num_vmodes;
138 }
139
140 struct video_mode *get_video_mode(int idx)
141 {
142         if(idx == VMODE_CURRENT) {
143                 return curmode;
144         }
145         return vmodes + idx;
146 }
147
148 int match_video_mode(int xsz, int ysz, int bpp)
149 {
150         int i, best = -1;
151         struct video_mode *vm;
152
153         for(i=0; i<num_vmodes; i++) {
154                 vm = vmodes + i;
155                 if(vm->xsz != xsz || vm->ysz != ysz) continue;
156                 if(SAME_BPP(vm->bpp, bpp)) {
157                         best = i;
158                 }
159                 if(vm->bpp == bpp) break;
160         }
161
162         if(best == -1) {
163                 fprintf(stderr, "failed to find video mode %dx%d %d bpp)\n", xsz, ysz, bpp);
164                 return -1;
165         }
166         return best;
167 }
168
169 int find_video_mode(int mode)
170 {
171         int i;
172         struct video_mode *vm;
173
174         vm = vmodes;
175         for(i=0; i<num_vmodes; i++) {
176                 if(vm->mode == mode) return i;
177                 vm++;
178         }
179         return -1;
180 }
181
182 void *set_video_mode(int idx, int nbuf)
183 {
184         unsigned int mode;
185         struct video_mode *vm = vmodes + idx;
186         struct cpuid_info cpu;
187
188         if(curmode == vm) return vpgaddr[0];
189
190         printf("setting video mode %x (%dx%d %d bpp)\n", (unsigned int)vm->mode,
191                         vm->xsz, vm->ysz, vm->bpp);
192         fflush(stdout);
193
194 #ifndef DBG_NOLFB
195         mode = vm->mode | VBE_MODE_LFB;
196         if(vbe_setmode(mode) == -1) {
197 #endif
198                 mode = vm->mode;
199                 if(vbe_setmode(mode) == -1) {
200                         fprintf(stderr, "failed to set video mode %x\n", (unsigned int)vm->mode);
201                         return 0;
202                 }
203                 printf("Warning: failed to get a linear framebuffer. falling back to banked mode\n");
204 #ifndef DBG_NOLFB
205         }
206 #endif
207
208         /* unmap previous video memory mapping, if there was one (switching modes) */
209         if(vpgaddr[0] && vpgaddr[0] != VMEM_PTR) {
210                 dpmi_munmap(vpgaddr[0]);
211                 vpgaddr[0] = vpgaddr[1] = 0;
212         }
213
214         curmode = vm;
215         if(nbuf < 1) nbuf = 1;
216         if(nbuf > 2) nbuf = 2;
217         pgcount = nbuf > vm->max_pages + 1 ? vm->max_pages + 1 : nbuf;
218         pgsize = vm->ysz * vm->pitch;
219         fbsize = pgcount * pgsize;
220
221         if(vm->bpp > 8) {
222                 printf("rgb mask: %x %x %x\n", (unsigned int)vm->rmask,
223                                 (unsigned int)vm->gmask, (unsigned int)vm->bmask);
224                 printf("rgb shift: %d %d %d\n", vm->rshift, vm->gshift, vm->bshift);
225         }
226         printf("pgcount: %d, pgsize: %d, fbsize: %d\n", pgcount, pgsize, fbsize);
227         if(vm->fb_addr) {
228                 printf("phys addr: %p\n", (void*)vm->fb_addr);
229         }
230         fflush(stdout);
231
232         if(vm->fb_addr) {
233                 vpgaddr[0] = (void*)dpmi_mmap(vm->fb_addr, fbsize);
234                 if(!vpgaddr[0]) {
235                         fprintf(stderr, "failed to map framebuffer (phys: %lx, size: %d)\n",
236                                         (unsigned long)vm->fb_addr, fbsize);
237                         set_text_mode();
238                         return 0;
239                 }
240                 memset(vpgaddr[0], 0xaa, pgsize);
241
242                 if(pgcount > 1) {
243                         vpgaddr[1] = (char*)vpgaddr[0] + pgsize;
244                         backidx = 1;
245                         page_flip(FLIP_NOW);    /* start with the second page visible */
246                 } else {
247                         frontidx = backidx = 0;
248                         vpgaddr[1] = 0;
249                 }
250
251                 blit_frame = blit_frame_lfb;
252
253 #ifdef ENABLE_WRCOMB
254                 if(read_cpuid(&cpu) != -1 && cpu.feat & CPUID_FEAT_MTRR) {
255                         uint32_t len = (uint32_t)vbe.vmem_blk << 16;
256
257                         /* if vmem_blk is 0 or if the reported size is absurd (more than
258                          * 256mb), just use the framebuffer size for this mode to setup the
259                          * mtrr
260                          */
261                         if(!len || len > 0x10000000) {
262                                 printf("reported vmem too large or overflowed, using fbsize for wrcomb setup\n");
263                                 len = fbsize;
264                         }
265                         print_mtrr();
266                         enable_wrcomb(vm->fb_addr, len);
267                 }
268 #endif
269
270         } else {
271                 vpgaddr[0] = VMEM_PTR;
272                 if(pgcount > 1) {
273                         vpgaddr[1] = VMEM_PTR;
274                         backidx = 1;
275                         page_flip(FLIP_NOW);    /* start with the second page visible */
276                 } else {
277                         frontidx = backidx = 0;
278                         vpgaddr[1] = 0;
279                 }
280
281                 blit_frame = blit_frame_banked;
282
283                 /* calculate window granularity shift */
284                 vm->win_gran_shift = 0;
285                 vm->win_64k_step = 1;
286                 if(vm->win_gran > 0 && vm->win_gran < 64) {
287                         int gran = vm->win_gran;
288                         while(gran < 64) {
289                                 vm->win_gran_shift++;
290                                 gran <<= 1;
291                         }
292                         vm->win_64k_step = 1 << vm->win_gran_shift;
293                 }
294
295                 printf("granularity: %dk (step: %d)\n", vm->win_gran, vm->win_64k_step);
296         }
297
298         fflush(stdout);
299         return vpgaddr[0];
300 }
301
302 int set_text_mode(void)
303 {
304         /* unmap previous video memory mapping, if there was one (switching modes) */
305         if(vpgaddr[0] && vpgaddr[0] != VMEM_PTR) {
306                 dpmi_munmap(vpgaddr[0]);
307                 vpgaddr[0] = vpgaddr[1] = 0;
308         }
309
310         vga_setmode(3);
311         curmode = 0;
312         return 0;
313 }
314
315 void *page_flip(int vsync)
316 {
317         if(!vpgaddr[1]) {
318                 /* page flipping not supported */
319                 return vpgaddr[0];
320         }
321
322         vbe_swap(backidx ? pgsize : 0, vsync ? VBE_SWAP_VBLANK : VBE_SWAP_NOW);
323         frontidx = backidx;
324         backidx = (backidx + 1) & 1;
325
326         return vpgaddr[backidx];
327 }
328
329
330 static void blit_frame_lfb(void *pixels, int vsync)
331 {
332         if(vsync) wait_vsync();
333         memcpy64(vpgaddr[frontidx], pixels, pgsize >> 3);
334 }
335
336 static void blit_frame_banked(void *pixels, int vsync)
337 {
338         int sz, offs, pending;
339         unsigned char *pptr = pixels;
340
341         if(vsync) wait_vsync();
342
343         /* assume initial window offset at 0 */
344         offs = 0;
345         pending = pgsize;
346         while(pending > 0) {
347                 sz = pending > 65536 ? 65536 : pending;
348                 /*memcpy64(VMEM_PTR, pptr, sz >> 3);*/
349                 memcpy(VMEM_PTR, pptr, sz);
350                 pptr += sz;
351                 pending -= sz;
352                 offs += curmode->win_64k_step;
353                 vbe_setwin(0, offs);
354         }
355         vbe_setwin(0, 0);
356 }
357
/* Builds a bit mask of sz consecutive set bits, starting at bit position pos.
 *
 * sz:  number of bits in the field; values <= 0 give an empty mask, values
 *      >= 32 are treated as 32
 * pos: position of the least significant bit of the field (0..31)
 *
 * Bits which would end up above bit 31 are dropped. A pos outside 0..31
 * yields 0, rather than performing a shift with undefined behavior.
 */
static uint32_t calc_mask(int sz, int pos)
{
        uint32_t mask;

        if(sz <= 0 || pos < 0 || pos >= 32) {
                return 0;
        }

        /* shifting a 32bit value by 32 is undefined, so handle a full-width field separately */
        mask = sz >= 32 ? 0xffffffffu : ((uint32_t)1 << sz) - 1;
        return mask << pos;
}
366
#ifdef __GNUC__
/* get_msr(msr, low, high): executes rdmsr with msr in ecx, and stores eax
 * into low and edx into high. low and high must be assignable lvalues.
 */
#define get_msr(msr, low, high) \
        asm volatile( \
                "\r\trdmsr" \
                : "=a"(low), "=d"(high) \
                : "c"(msr))

/* set_msr(msr, low, high): executes wrmsr with msr in ecx, low in eax and
 * high in edx.
 */
#define set_msr(msr, low, high) \
        asm volatile( \
                "\r\twrmsr" \
                :: "c"(msr), "a"(low), "d"(high))

#endif  /* __GNUC__ */
380
#ifdef __WATCOMC__
/* get_msr(msr, low, high): same calling form as the GNU C variant; low and
 * high must be lvalues, as their addresses are passed to get_msr_asm.
 */
#define get_msr(msr, low, high) get_msr_asm(msr, &low, &high)

/* Executes rdmsr with msr in ecx and stores the result through the pointers
 * passed in ebx (low half, from eax) and esi (high half, from edx).
 * rdmsr writes both eax and edx, so both are listed as modified; otherwise
 * the compiler is free to keep a live value in edx across the call.
 */
void get_msr_asm(uint32_t msr, uint32_t *lowptr, uint32_t *highptr);
#pragma aux get_msr_asm = \
        "rdmsr" \
        "mov [ebx], eax" \
        "mov [esi], edx" \
        parm [ecx][ebx][esi] \
        modify [eax edx]

/* Executes wrmsr with msr in ecx, low in eax and high in edx. */
void set_msr(uint32_t msr, uint32_t low, uint32_t high);
#pragma aux set_msr = \
        "wrmsr" \
        parm [ecx][eax][edx]

#endif  /* __WATCOMC__ */
398
399
/* MTRR related model-specific registers.
 * MSR_MTRRCAP: the low byte of its low half is used as the number of variable
 * ranges. MSR_MTRRBASE(x) / MSR_MTRRMASK(x) select the base/mask register
 * pair of variable range x.
 */
#define MSR_MTRRCAP                     0xfe
#define MSR_MTRRDEFTYPE         0x2ff
#define MSR_MTRRBASE(x)         (0x200 | ((x) << 1))
#define MSR_MTRRMASK(x)         (0x201 | ((x) << 1))
/* flag bits tested/set in the low halves of the registers above */
#define MTRRDEF_EN                      0x800   /* in MSR_MTRRDEFTYPE: cleared while reprogramming, set afterwards */
#define MTRRCAP_HAVE_WC         0x400   /* in MSR_MTRRCAP: required for enabling write combining */
#define MTRRMASK_VALID          0x800   /* in MSR_MTRRMASK(x): range x is in use */

/* memory type value (low byte of a base register) for write combining */
#define MTRR_WC                         1
409
410 static int get_page_memtype(uint32_t addr, int num_ranges)
411 {
412         int i;
413         uint32_t rlow, rhigh;
414         uint32_t base, mask;
415
416         for(i=0; i<num_ranges; i++) {
417                 get_msr(MSR_MTRRMASK(i), rlow, rhigh);
418                 if(!(rlow & MTRRMASK_VALID)) {
419                         continue;
420                 }
421                 mask = rlow & 0xfffff000;
422
423                 get_msr(MSR_MTRRBASE(i), rlow, rhigh);
424                 base = rlow & 0xfffff000;
425
426                 if((addr & mask) == (base & mask)) {
427                         return rlow & 0xff;
428                 }
429         }
430
431         get_msr(MSR_MTRRDEFTYPE, rlow, rhigh);
432         return rlow & 0xff;
433 }
434
435 static int check_wrcomb_enabled(uint32_t addr, int len, int num_ranges)
436 {
437         while(len > 0) {
438                 if(get_page_memtype(addr, num_ranges) != MTRR_WC) {
439                         return 0;
440                 }
441                 addr += 4096;
442                 len -= 4096;
443         }
444         return 1;
445 }
446
447 static int alloc_mtrr(int num_ranges)
448 {
449         int i;
450         uint32_t rlow, rhigh;
451
452         for(i=0; i<num_ranges; i++) {
453                 get_msr(MSR_MTRRMASK(i), rlow, rhigh);
454                 if(!(rlow & MTRRMASK_VALID)) {
455                         return i;
456                 }
457         }
458         return -1;
459 }
460
/* Attempts to make the physical range of len bytes starting at addr
 * write-combining, by programming an unused variable-range MTRR.
 *
 * addr and len must both be multiples of 4k and len must be positive.
 * Does nothing if the whole range is already write-combining. Failures are
 * reported on stderr; there's no return value.
 */
static void enable_wrcomb(uint32_t addr, int len)
{
        int num_ranges, mtrr;
        uint32_t rlow, rhigh;
        uint32_t def, mask;

        /* this also rejects len <= 0, with the same "unaligned range" message */
        if(len <= 0 || (addr | (uint32_t)len) & 0xfff) {
                fprintf(stderr, "failed to enable write combining, unaligned range: %p/%x\n",
                                (void*)addr, (unsigned int)len);
                return;
        }

        /* low byte of the capability register: number of variable ranges */
        get_msr(MSR_MTRRCAP, rlow, rhigh);
        num_ranges = rlow & 0xff;

        printf("enable_wrcomb: addr=%p len=%x\n", (void*)addr, (unsigned int)len);

        if(!(rlow & MTRRCAP_HAVE_WC)) {
                fprintf(stderr, "failed to enable write combining, processor doesn't support it\n");
                return;
        }

        /* nothing to do if every page of the range is already write-combining */
        if(check_wrcomb_enabled(addr, len, num_ranges)) {
                return;
        }

        if((mtrr = alloc_mtrr(num_ranges)) == -1) {
                fprintf(stderr, "failed to enable write combining, no free MTRRs\n");
                return;
        }

        /* smear the highest set bit of len - 1 downwards, which gives the next
         * power of two >= len, minus one. Inverting that and keeping bits 12-31
         * produces the range mask; a len which isn't a power of two is
         * effectively rounded up.
         * NOTE(review): addr is not checked for alignment to that rounded-up
         * size -- confirm callers always pass a suitably aligned base.
         */
        mask = len - 1;
        mask |= mask >> 1;
        mask |= mask >> 2;
        mask |= mask >> 4;
        mask |= mask >> 8;
        mask |= mask >> 16;
        mask = ~mask & 0xfffff000;

        printf("  ... mask: %08x\n", (unsigned int)mask);

        /* the registers are rewritten with interrupts off, and with the enable
         * bit of the default type register cleared for the duration
         */
        disable();
        get_msr(MSR_MTRRDEFTYPE, def, rhigh);
        set_msr(MSR_MTRRDEFTYPE, def & ~MTRRDEF_EN, rhigh);

        set_msr(MSR_MTRRBASE(mtrr), addr | MTRR_WC, 0);
        set_msr(MSR_MTRRMASK(mtrr), mask | MTRRMASK_VALID, 0);

        /* NOTE(review): this always sets the enable bit, even if it was clear
         * when read above, and writes 0 (not rhigh) to the high half -- confirm
         * this is intended.
         */
        set_msr(MSR_MTRRDEFTYPE, def | MTRRDEF_EN, 0);
        enable();
}
512
/* Names of the MTRR memory types, indexed by the type value found in the low
 * byte of a base register. Type 0 is uncacheable, which is a valid type and
 * gets its own name; "N/A" is reserved for values that are not memory types.
 */
static const char *mtrr_names[] = { "U C", "W C", "N/A", "N/A", "W T", "W P", "W B" };

/* Returns a printable name for an MTRR memory type value, or "N/A" for
 * values outside the table. The returned string must not be modified.
 */
static const char *mtrr_type_name(int type)
{
        if(type < 0 || type >= (int)(sizeof mtrr_names / sizeof *mtrr_names)) {
                return "N/A";
        }
        return mtrr_names[type];
}
522
523 static void print_mtrr(void)
524 {
525         int i, num_ranges;
526         uint32_t rlow, rhigh, base, mask;
527
528         get_msr(MSR_MTRRCAP, rlow, rhigh);
529         num_ranges = rlow & 0xff;
530
531         for(i=0; i<num_ranges; i++) {
532                 get_msr(MSR_MTRRBASE(i), base, rhigh);
533                 get_msr(MSR_MTRRMASK(i), mask, rhigh);
534
535                 if(mask & MTRRMASK_VALID) {
536                         printf("mtrr%d: base %p, mask %08x type %s\n", i, (void*)(base & 0xfffff000),
537                                         (unsigned int)(mask & 0xfffff000), mtrr_type_name(base & 0xff));
538                 } else {
539                         printf("mtrr%d unused (%08x/%08x)\n", i, (unsigned int)base,
540                                         (unsigned int)mask);
541                 }
542         }
543         fflush(stdout);
544 }