5 Commits

Author SHA1 Message Date
507b4f5511 Merge pull request #89 from vmttmv/fix/bl-bounds
Establish well-defined read buffers for bl, implement error printing
2026-01-07 21:00:00 -08:00
Borna Šoštarić
12046ce96b fix vga clear section in on_error 2026-01-08 05:20:42 +01:00
vmttmv
a9b8ac7066 Establish well-defined read buffers for bl, implement error printing 2026-01-07 02:33:46 +02:00
d6ab8c91f8 Merge pull request #87 from vmttmv/fix/bl-nonaligned-reads
Fix non-aligned disk reads in bootloader
2026-01-05 17:45:37 -08:00
vmttmv
35ebd5fd72 Fix non-aligned disk reads in bootloader 2026-01-06 00:44:55 +02:00
3 changed files with 179 additions and 145 deletions

View File

@@ -24,84 +24,3 @@ _start:
call load_kernel call load_kernel
jmp eax jmp eax
; ----------------------------------------------------------------------------
; ATA read sectors (LBA mode)
;
; sysv32 abi signature:
; void ata_lba_read(uint32_t lba, uint8_t nsect, void *addr);
; ----------------------------------------------------------------------------
ata_lba_read:
push ebp
mov ebp, esp
push ebx
push ecx
push edx
push edi
; Wait BSY=0 before proceeding to write the regs
.wait_rdy:
mov edx, 0x1F7
in al, dx
test al, 0x80
jnz .wait_rdy
mov eax, [ebp+8] ; arg #1 = LBA
mov cl, [ebp+12] ; arg #2 = # of sectors
mov edi, [ebp+16] ; arg #3 = buffer address
and eax, 0x0FFFFFFF
mov ebx, eax ; Save LBA in RBX
mov edx, 0x01F6 ; Port to send drive and bit 24 - 27 of LBA
shr eax, 24 ; Get bit 24 - 27 in al
or al, 11100000b ; Set bit 6 in al for LBA mode
out dx, al
mov edx, 0x01F2 ; Port to send number of sectors
mov al, cl ; Get number of sectors from CL
out dx, al
mov edx, 0x1F3 ; Port to send bit 0 - 7 of LBA
mov eax, ebx ; Get LBA from EBX
out dx, al
mov edx, 0x1F4 ; Port to send bit 8 - 15 of LBA
mov eax, ebx ; Get LBA from EBX
shr eax, 8 ; Get bit 8 - 15 in AL
out dx, al
mov edx, 0x1F5 ; Port to send bit 16 - 23 of LBA
mov eax, ebx ; Get LBA from EBX
shr eax, 16 ; Get bit 16 - 23 in AL
out dx, al
mov edx, 0x1F7 ; Command port
mov al, 0x20 ; Read with retry.
out dx, al
mov bl, cl ; Save # of sectors in BL
.wait_rdy2:
mov edx, 0x1F7
.do_wait_rdy2:
in al, dx
test al, 0x80 ; BSY?
jnz .do_wait_rdy2
test al, 0x8 ; DRQ?
jz .do_wait_rdy2
mov edx, 0x1F0 ; Data port, in and out
mov ecx, 256
rep insw ; in to [RDI]
dec bl ; are we...
jnz .wait_rdy2 ; ...done?
pop edi
pop edx
pop ecx
pop ebx
pop ebp
ret

View File

@@ -9,6 +9,4 @@ SECTIONS {
*(.bss*) *(.bss*)
*(COMMON) *(COMMON)
} }
read_buf = .;
} }

View File

@@ -1,5 +1,20 @@
#include <stddef.h>
#include <stdint.h> #include <stdint.h>
// ATA IO Ports
#define ATA_PRIMARY_DATA 0x1F0
#define ATA_PRIMARY_ERR_FEATURES 0x1F1
#define ATA_PRIMARY_SEC_COUNT 0x1F2
#define ATA_PRIMARY_LBA_LOW 0x1F3
#define ATA_PRIMARY_LBA_MID 0x1F4
#define ATA_PRIMARY_LBA_HIGH 0x1F5
#define ATA_PRIMARY_DRIVE_SEL 0x1F6
#define ATA_PRIMARY_COMM_STAT 0x1F7
// ATA Commands
#define ATA_CMD_READ_PIO 0x20
#define ATA_CMD_WRITE_PIO 0x30
// ELF Ident indexes // ELF Ident indexes
#define EI_NIDENT 16 #define EI_NIDENT 16
@@ -7,6 +22,19 @@
#define PT_NULL 0 #define PT_NULL 0
#define PT_LOAD 1 #define PT_LOAD 1
// Disk sector size
#define SECTOR_SIZE 512
#define PH_PER_SECTOR (SECTOR_SIZE / sizeof(Elf32_Phdr))
// Kernel start LBA
#define KERN_START_SECT 5
// VGA
// Expects bios initialization for text mode (3), buffer at 0xb8000
#define VGA_ADDRESS 0xB8000
#define VGA_COLS 80
#define VGA_ROWS 25
// ELF Header (32-bit) // ELF Header (32-bit)
typedef struct { typedef struct {
uint8_t e_ident[EI_NIDENT]; uint8_t e_ident[EI_NIDENT];
@@ -37,82 +65,171 @@ typedef struct {
uint32_t p_align; uint32_t p_align;
} __attribute__((packed)) Elf32_Phdr; } __attribute__((packed)) Elf32_Phdr;
static inline uint8_t inb(uint16_t port)
{
uint8_t ret;
__asm__ volatile ("inb %1, %0"
: "=a"(ret)
: "Nd"(port));
return ret;
}
static inline void outb(uint16_t port, uint8_t val)
{
__asm__ volatile ("outb %0, %1"
:
: "a"(val), "Nd"(port));
}
static inline uint16_t inw(uint16_t port)
{
uint16_t ret;
__asm__ volatile ("inw %1, %0"
: "=a"(ret)
: "Nd"(port));
return ret;
}
static inline void ata_wait_bsy() {
while (inb(ATA_PRIMARY_COMM_STAT) & 0x80);
}
static inline void ata_wait_drq() {
while (!(inb(ATA_PRIMARY_COMM_STAT) & 0x08));
}
static void ata_read_sector(void *addr, uint32_t lba) {
ata_wait_bsy();
outb(ATA_PRIMARY_DRIVE_SEL, 0xE0 | ((lba >> 24) & 0x0F));
outb(ATA_PRIMARY_SEC_COUNT, 1);
outb(ATA_PRIMARY_LBA_LOW, (uint8_t)lba);
outb(ATA_PRIMARY_LBA_MID, (uint8_t)(lba >> 8));
outb(ATA_PRIMARY_LBA_HIGH, (uint8_t)(lba >> 16));
outb(ATA_PRIMARY_COMM_STAT, ATA_CMD_READ_PIO);
uint16_t* ptr = (uint16_t*)addr;
ata_wait_bsy();
ata_wait_drq();
for (int i = 0; i < 256; i++) {
*ptr++ = inw(ATA_PRIMARY_DATA);
}
}
static void ata_read_sectors(uint8_t *addr, uint32_t offset, uint32_t size)
{
// Reads are offset from the starting sector of the kernel
uint32_t lba = KERN_START_SECT + offset / SECTOR_SIZE;
uint32_t off = offset % 512;
uint8_t data[512];
while (size > 0) {
ata_read_sector(data, lba);
uint32_t copy = 512 - off;
if (copy > size) {
copy = size;
}
for (uint32_t i = 0; i < copy; i++) {
addr[i] = data[off + i];
}
addr += copy;
size -= copy;
lba++;
off = 0;
}
}
static void on_error(const char *msg)
{
uint16_t *ptr = (uint16_t *)VGA_ADDRESS;
// Clear
uint16_t val = 0x0f00 | (uint8_t)' ';
for (size_t i = 0; i < VGA_COLS * VGA_ROWS; i++) {
ptr[i] = val;
}
// Print error
for (size_t i = 0; msg[i]; i++) {
ptr[i] = 0xf00 | (uint8_t)msg[i];
}
// Halt
while (1) {
__asm__("hlt");
}
}
// Load an ELF executable into memory. // Load an ELF executable into memory.
static int elf_load(const void* data, void (*load_segment)(uint8_t *vaddr, uint32_t src, uint32_t size)) { // NOTE: Only 32-byte program headers are supported.
const Elf32_Ehdr* header = (const Elf32_Ehdr*)data; // Returns the entry point to the program.
const Elf32_Phdr* ph = (const Elf32_Phdr*)((uint8_t*)data + header->e_phoff); static void *elf_load(const void *data) {
const Elf32_Ehdr *header = (const Elf32_Ehdr*)data;
if (header->e_phentsize != sizeof(Elf32_Phdr)) {
// The bootloader only handles 32-byte program header entries
on_error("ERROR: Unsupported program header entry size, halting...");
}
// Buffer for the program headers
uint8_t file_buf[SECTOR_SIZE];
// Current file offset to the next program header
uint32_t file_offset = header->e_phoff;
for (int i = 0; i < header->e_phnum; i++) { for (int i = 0; i < header->e_phnum; i++) {
if (ph[i].p_type != PT_LOAD) // Check for sector boundary.
// Program headers are read in a sector at a time
// 512 / 32 = 16 PH per sector
if (i % PH_PER_SECTOR == 0) {
uint32_t count = (header->e_phnum - i) * sizeof(Elf32_Phdr);
if (count > SECTOR_SIZE) {
count = SECTOR_SIZE;
}
// Reads
ata_read_sectors(file_buf, file_offset, count);
file_offset += count;
}
// PH being processed currently, index mod 16 as headers
// are being loaded in sector by sector.
const Elf32_Phdr *ph = (const Elf32_Phdr *)file_buf + (i % PH_PER_SECTOR);
// Discard non-load segments
if (ph->p_type != PT_LOAD)
continue; continue;
uint32_t offset = ph[i].p_offset; // Load in the segment
uint32_t vaddr = ph[i].p_vaddr; uint32_t offset = ph->p_offset;
uint32_t filesz = ph[i].p_filesz; uint32_t filesz = ph->p_filesz;
uint32_t memsz = ph[i].p_memsz; uint32_t memsz = ph->p_memsz;
uint8_t *vaddr = (uint8_t *)ph->p_vaddr;
// Copy data segment ata_read_sectors(vaddr, offset, filesz);
//load_segment((uint8_t *)vaddr, offset, filesz);
load_segment((uint8_t *)vaddr, offset, filesz);
// Zero remaining BSS (if any) // Zero remaining BSS (if any)
if (memsz > filesz) { if (memsz > filesz) {
uint8_t* bss_start = (uint8_t*)(vaddr + filesz); uint8_t* bss_start = vaddr + filesz;
for (uint32_t j = 0; j < memsz - filesz; j++) { for (uint32_t j = 0; j < memsz - filesz; j++) {
bss_start[j] = 0; bss_start[j] = 0;
} }
} }
} }
return header->e_entry; // Return the entry point
} return (void *)header->e_entry;
#define KERN_START_SECT 5
#define MAX(a, b) ((a)>(b) ? (a) : (b))
extern void ata_lba_read(uint32_t lba, uint8_t nsect, void *addr);
extern uint8_t read_buf[];
static uint32_t
total_header_size(const Elf32_Ehdr *header) {
uint32_t phend = header->e_phoff + header->e_phentsize*header->e_phnum;
// Align to 512
return (phend + 511) & ~511;
}
static void read_sectors(uint8_t *vaddr, uint32_t offset, uint32_t size) {
// # of sectors to read
uint32_t rem_nsect = ((size + 511) & ~511) / 512;
// Current lba address, offset by the first sector already read
uint32_t lba = KERN_START_SECT + offset / 512;
// Max 255 sectors at a time
while (rem_nsect) {
uint8_t nsect = rem_nsect > 255 ? 255 : rem_nsect;
ata_lba_read(lba, nsect, vaddr);
vaddr += nsect * 512;
rem_nsect -= nsect;
lba += nsect;
}
} }
void *load_kernel(void) { void *load_kernel(void) {
// Read the first sector // ELF header buffer
ata_lba_read(KERN_START_SECT, 1, read_buf); uint8_t header_buf[SECTOR_SIZE];
const Elf32_Ehdr* header = (const Elf32_Ehdr*)read_buf; // Read the first sector (contains the ELF header)
ata_read_sector(header_buf, KERN_START_SECT);
// Remaining data size, subtract the first 512B already read // `elf_load()` returns the entry point
uint32_t rem = total_header_size(header) - 512; return elf_load(header_buf);
// Read the rest if necessary
if (rem)
read_sectors(read_buf+512, 512, rem);
elf_load(read_buf, read_sectors);
return (void *)header->e_entry;
} }