+ .code16
+unreal:
+ # use the same GDT above, will use data segment: 2
+ lgdt (gdt_lim)
+
+ mov %cr0, %eax
+ or $1, %ax
+ mov %eax, %cr0
+ jmp 0f
+
+0: mov $0x10, %ax
+ mov %ax, %ds
+ mov %ax, %es
+ mov %ax, %fs
+ mov %ax, %gs
+ mov %ax, %ss
+
+ mov %cr0, %eax
+ and $0xfffe, %ax
+ mov %eax, %cr0
+
+ xor %ax, %ax
+ mov %ax, %ds
+ mov %ax, %es
+ mov %ax, %fs
+ mov %ax, %gs
+ mov %ax, %ss
+ ret
+
+mainsz_msg: .asciz "Main program size: "
+mainsz_msg2: .asciz " ("
+mainsz_msg3: .asciz " sectors)\n"
+
+first_sect: .long 0
+sect_left: .long 0
+cur_track: .long 0
+trk_sect: .long 0
+dest_ptr: .long 0
+
+load_main:
+ movl $main_load_addr, dest_ptr
+
+ # calculate first sector
+ mov $_boot2_size, %eax
+ add $511, %eax
+ shr $9, %eax
+ # add 1 to account for the boot sector
+ inc %eax
+ mov %eax, first_sect
+
+ # calculate the first track (first_sect / sect_per_track)
+ movzxw sect_per_track, %ecx
+ xor %edx, %edx
+ div %ecx
+ mov %eax, cur_track
+ # remainder is sector within track
+ mov %edx, trk_sect
+
+ mov $mainsz_msg, %esi
+ call putstr
+ mov $_main_size, %eax
+ mov %eax, %ecx
+ call print_num
+
+ mov $mainsz_msg2, %esi
+ call putstr
+
+ # calculate sector count
+ add $511, %eax
+ shr $9, %eax
+ mov %eax, sect_left
+
+ call print_num
+ mov $mainsz_msg3, %esi
+ call putstr
+
+ # read a whole track into the buffer (or partial first track)
+ldloop:
+ movzxw sect_per_track, %ecx
+ sub trk_sect, %ecx
+ push %ecx
+ call read_track
+
+ # debug: print the first 32bits of the track
+ #mov buffer, %eax
+ #call print_num
+ #mov $10, %al
+ #call putchar
+
+ # copy to high memory
+ mov $buffer, %esi
+ mov dest_ptr, %edi
+ mov (%esp), %ecx
+ shl $9, %ecx
+ add %ecx, dest_ptr
+ shr $2, %ecx
+ addr32 rep movsl
+
+ incl cur_track
+ # other than the first track which might be partial, all the rest start from 0
+ movl $0, trk_sect
+
+ pop %ecx
+ sub %ecx, sect_left
+ ja ldloop
+
+ # the BIOS might have enabled interrupts
+ cli
+
+ # if we were loaded from floppy, turn all floppy motors off
+ movb drive_number, %bl
+ and $0x80, %bl
+ jnz 0f
+ mov $0x3f2, %dx
+ in %dx, %al
+ and $0xf, %al
+ out %al, %dx
+0:
+
+ mov $10, %ax
+ call putchar
+
+ ret
+
+rdtrk_msg: .asciz "Reading track: "
+rdcyl_msg: .asciz " - cyl: "
+rdhead_msg: .asciz " head: "
+rdsect_msg: .asciz " start sect: "
+rdlast_msg: .asciz " ... "
+rdok_msg: .asciz "OK\n"
+rdfail_msg: .asciz "failed\n"
+
+read_retries: .short 0
+
+read_track:
+ # set es to the start of the destination buffer to allow reading in
+ # full 64k chunks if necessary
+ mov $buffer, %bx
+ shr $4, %bx
+ mov %bx, %es
+ xor %ebx, %ebx
+
+ movw $3, read_retries
+
+read_try:
+ # print track
+ mov $rdtrk_msg, %esi
+ call putstr
+ mov cur_track, %eax
+ call print_num
+ mov $rdcyl_msg, %esi
+ call putstr
+
+ # calc cylinder (cur_track / num_heads) and head (cur_track % num_heads)
+ mov cur_track, %eax
+ movzxw num_heads, %ecx
+ xor %edx, %edx
+ div %ecx
+
+ # print cylinder
+ push %eax
+ call print_num
+ # print head
+ mov $rdhead_msg, %esi
+ call putstr
+ movzx %dx, %eax
+ call print_num
+ pop %eax
+
+ # head in dh
+ mov %dl, %dh
+
+ # cylinder low byte at ch and high bits at cl[7, 6]
+ mov %al, %ch
+ mov %ah, %cl
+ and $3, %cl
+ ror $2, %cl
+
+ # print start sector
+ mov $rdsect_msg, %esi
+ call putstr
+ mov trk_sect, %eax
+ call print_num
+ mov $rdlast_msg, %esi
+ call putstr
+
+ # start sector (1-based) in cl[0, 5]
+ mov trk_sect, %al
+ inc %al
+ and $0x3f, %al
+ or %al, %cl
+
+ # number of sectors in al
+ mov 2(%esp), %ax
+ # call number (2) in ah
+ mov $2, %ah
+ # drive number in dl
+ movb drive_number, %dl
+ int $0x13
+ jnc read_ok
+
+ # abort after 3 attempts
+ decw read_retries
+ jz read_fail
+
+ # error, reset controller and retry
+ xor %ah, %ah
+ int $0x13
+ jmp read_try
+
+read_fail:
+ mov $rdfail_msg, %esi
+ call putstr
+ jmp abort_read
+
+read_ok:
+ mov $rdok_msg, %esi
+ call putstr
+
+ # reset es to 0 before returning
+ xor %ax, %ax
+ mov %ax, %es
+ ret
+
+str_read_error: .asciz "Read error while reading track: "
+
+abort_read:
+ mov $str_read_error, %esi
+ call putstr
+ mov cur_track, %eax
+ call print_num
+ mov $10, %al
+ call putchar
+
+ cli
+0: hlt
+ jmp 0b
+
+
+ # better print routines, since we're not constrainted by the 512b of
+ # the boot sector.
+ .global cursor_x
+ .global cursor_y
+cursor_x: .long 0
+cursor_y: .long 0
+
+putchar:
+ pushal
+ call ser_putchar
+
+ cmp $10, %al
+ jnz 0f
+ call video_newline
+ jmp 1f
+
+0: push %eax
+ mov cursor_y, %eax
+ mov $80, %ecx
+ mul %ecx
+ add cursor_x, %eax
+ mov %eax, %ebx
+ pop %eax
+
+ mov $0xb8000, %edx
+
+ # this looks retarded. in nasm: [ebx * 2 + edx]
+ mov %al, (%edx, %ebx, 2)
+ movb $7, 1(%edx, %ebx, 2)
+ incl cursor_x
+ cmpl $80, cursor_x
+ jnz 1f
+ call video_newline
+
+1: popal
+ ret
+
+ # expects string pointer in esi
+putstr:
+ mov (%esi), %al
+ cmp $0, %al
+ jz 0f
+ call putchar
+ inc %esi
+ jmp putstr
+0: ret
+
+ # expects number in eax
+print_num:
+ # save registers
+ pushal
+
+ mov $numbuf + 16, %esi
+ movb $0, (%esi)
+ mov $10, %ebx
+convloop:
+ xor %edx, %edx
+ div %ebx
+ add $48, %dl
+ dec %esi
+ mov %dl, (%esi)
+ cmp $0, %eax
+ jnz convloop
+
+ call putstr
+
+ # restore regs
+ popal
+ ret
+
+
+video_newline:
+ movl $0, cursor_x
+ incl cursor_y
+ cmpl $25, cursor_y
+ jnz 0f
+ call scrollup
+ decl cursor_y
+0: ret
+
+scrollup:
+ pushal
+ # move 80 * 24 lines from b80a0 -> b8000
+ mov $0xb8000, %edi
+ mov $0xb80a0, %esi
+ mov $960, %ecx
+ addr32 rep movsl
+ # clear last line (b8f00)
+ mov $0xb8f00, %edi
+ xor %eax, %eax
+ mov $40, %ecx
+ addr32 rep stosl
+ popal
+ ret
+
+clearscr:
+ mov $0xb8000, %edi
+ # clear with white-on-black spaces
+ mov $0x07200720, %eax
+ mov $1000, %ecx
+ addr32 rep stosl
+ ret
+
+ .set UART_DATA, 0x3f8
+ .set UART_DIVLO, 0x3f8
+ .set UART_DIVHI, 0x3f9
+ .set UART_FIFO, 0x3fa
+ .set UART_LCTL, 0x3fb
+ .set UART_MCTL, 0x3fc
+ .set UART_LSTAT, 0x3fd
+ .set DIV_9600, 115200 / 9600
+ .set LCTL_8N1, 0x03
+ .set LCTL_DLAB, 0x80
+ .set FIFO_ENABLE_CLEAR, 0x07
+ .set MCTL_DTR_RTS_OUT2, 0x0b
+ .set LST_TREG_EMPTY, 0x20
+
+setup_serial:
+ # set clock divisor
+ mov $LCTL_DLAB, %al
+ mov $UART_LCTL, %dx
+ out %al, %dx
+ mov $DIV_9600, %ax
+ mov $UART_DIVLO, %dx
+ out %al, %dx
+ shr $8, %ax
+ mov $UART_DIVHI, %dx
+ out %al, %dx
+ # set format 8n1
+ mov $LCTL_8N1, %al
+ mov $UART_LCTL, %dx
+ out %al, %dx
+ # clear and enable fifo
+ mov $FIFO_ENABLE_CLEAR, %al
+ mov $UART_FIFO, %dx
+ out %al, %dx
+ # assert RTS and DTR
+ mov $MCTL_DTR_RTS_OUT2, %al
+ mov $UART_MCTL, %dx
+ out %al, %dx
+ ret
+
+
+ser_putchar:
+ push %dx
+
+ cmp $10, %al
+ jnz 0f
+ push %ax
+ mov $13, %al
+ call ser_putchar
+ pop %ax
+
+0: mov %al, %ah
+ # wait until the transmit register is empty
+ mov $UART_LSTAT, %dx
+wait: in %dx, %al
+ and $LST_TREG_EMPTY, %al
+ jz wait
+ mov $UART_DATA, %dx
+ mov %ah, %al
+ out %al, %dx
+
+ pop %dx
+ ret
+
+
+
+ena20_msg: .asciz "A20 line enabled\n"
+
+enable_a20:
+ call test_a20
+ jnc a20done
+ call enable_a20_kbd
+ call test_a20
+ jnc a20done
+ call enable_a20_fast
+ call test_a20
+ jnc a20done
+ # keep trying ... we can't do anything useful without A20 anyway
+ jmp enable_a20
+a20done:
+ mov $ena20_msg, %esi
+ call putstr
+ ret
+
+ # CF = 1 if A20 test fails (not enabled)
+test_a20:
+ mov $0x07c000, %ebx
+ mov $0x17c000, %edx
+ movl $0xbaadf00d, (%ebx)
+ movl $0xaabbcc42, (%edx)
+ subl $0xbaadf00d, (%ebx)
+ ret
+
+ # enable A20 line through port 0x92 (fast A20)
+enable_a20_fast:
+ mov $ena20_fast_msg, %esi
+ call putstr
+
+ in $0x92, %al
+ or $2, %al
+ out %al, $0x92
+ ret
+
+ena20_fast_msg: .asciz "Attempting fast A20 enable\n"
+
+
+ # enable A20 line through the keyboard controller
+ .set KBC_DATA_PORT, 0x60
+ .set KBC_CMD_PORT, 0x64
+ .set KBC_STATUS_PORT, 0x64
+ .set KBC_CMD_RD_OUTPORT, 0xd0
+ .set KBC_CMD_WR_OUTPORT, 0xd1
+
+ .set KBC_STAT_OUT_RDY, 0x01
+ .set KBC_STAT_IN_FULL, 0x02
+
+enable_a20_kbd:
+ mov $ena20_kbd_msg, %esi
+ call putstr
+
+ call kbc_wait_write
+ mov $KBC_CMD_WR_OUTPORT, %al
+ out %al, $KBC_CMD_PORT
+ call kbc_wait_write
+ mov $0xdf, %al
+ out %al, $KBC_DATA_PORT
+ ret
+
+ena20_kbd_msg: .asciz "Attempting KBD A20 enable\n"
+
+ # wait until the keyboard controller is ready to accept another byte
+kbc_wait_write:
+ in $KBC_STATUS_PORT, %al
+ and $KBC_STAT_IN_FULL, %al
+ jnz kbc_wait_write