From b5a00f7a071d0a181a92ee870054b020350273e9 Mon Sep 17 00:00:00 2001
From: Vladimir Serbinenko <phcoder@gmail.com>
Date: Mon, 24 Feb 2025 17:51:35 +0300
Subject: [PATCH 1/2] Support X2APIC

It's needed in order to boot on Meteor Lake CPUs
---
 arch/x86_32/kernel.s | 21 -------------
 arch/x86_64/kernel.s | 26 ---------------
 arch/x86_pc.cpp      | 75 ++++++++++++++++++++++++++++++++++++++------
 3 files changed, 65 insertions(+), 57 deletions(-)

diff --git a/arch/x86_32/kernel.s b/arch/x86_32/kernel.s
index 5d49453..1aa36f9 100644
--- a/arch/x86_32/kernel.s
+++ b/arch/x86_32/kernel.s
@@ -225,27 +225,6 @@ SetupProcessor1:
 	lidt	[idt]
 	sti
 
-	; Enable the APIC.
-	; TODO Check it is actually present!
-	mov	ecx,0x1B
-	rdmsr
-	or	eax,0x800
-	wrmsr
-
-	; Set the spurious interrupt vector to 0xFF
-	mov	eax,0xEC3FF0F0
-	mov	ebx,[eax]
-	or	ebx,0x1FF
-	mov	[eax],ebx
-
-	; Use the flat processor addressing model
-	mov	eax,0xEC3FF0E0
-	mov	dword [eax],0xFFFFFFFF
-
-	; Make sure that no external interrupts are masked
-	xor	eax,eax
-	mov	[0xEC3FF080],eax
-
 	; TODO More feature detection and initialisation!
 
 	ret
diff --git a/arch/x86_64/kernel.s b/arch/x86_64/kernel.s
index 2b938ce..1ab83b5 100644
--- a/arch/x86_64/kernel.s
+++ b/arch/x86_64/kernel.s
@@ -327,32 +327,6 @@ SetupProcessor1:
 	lidt	[rax]
 	sti
 
-	.enable_apic:
-	; Enable the APIC!
-	; Since we're on AMD64, we know that the APIC will be present.
-	mov	ecx,0x1B
-	rdmsr
-	or	eax,0x800
-	wrmsr
-	and	eax,~0xFFF
-	mov	edi,eax
-
-	; Set the spurious interrupt vector to 0xFF
-	mov	rax,0xFFFFFE00000000F0 ; LOW_MEMORY_MAP_START + 0xF0
-	add	rax,rdi
-	mov	ebx,[rax]
-	or	ebx,0x1FF
-	mov	[rax],ebx
-
-	; Use the flat processor addressing model
-	mov	rax,0xFFFFFE00000000E0 ; LOW_MEMORY_MAP_START + 0xE0
-	add	rax,rdi
-	mov	dword [rax],0xFFFFFFFF
-
-	; Make sure that no external interrupts are masked
-	xor	rax,rax
-	mov	cr8,rax
-
 	ret
 
 SyscallEntry:
diff --git a/arch/x86_pc.cpp b/arch/x86_pc.cpp
index 2bf13a2..0cf4cda 100644
--- a/arch/x86_pc.cpp
+++ b/arch/x86_pc.cpp
@@ -41,6 +41,8 @@ uintptr_t physicalMemoryHighest;
 uint32_t bootloaderID;
 uintptr_t bootloaderInformationOffset;
 
+bool x2apic = false;
+
 // Spinlock since some drivers need to access it in IRQs (e.g. ACPICA).
 KSpinlock pciConfigSpinlock; 
 
@@ -81,7 +83,27 @@ const char *const exceptionInformation[] = {
 	"0x1F: Reserved/Unknown",
 };
 
+static uint64_t rdmsr(uint32_t msr_id)
+{
+	uint32_t low, high;
+
+	asm volatile ("rdmsr" : "=a" (low), "=d" (high) : "c" (msr_id));
+
+	return ((uint64_t) high << 32) | low;
+}
+
+static void wrmsr (uint32_t msr_id, uint64_t msr_value)
+{
+	uint32_t low = msr_value, high = msr_value >> 32;
+
+	asm volatile ("wrmsr" : : "c" (msr_id), "a" (low), "d" (high));
+}
+
+
 uint32_t LapicReadRegister(uint32_t reg) {
+	if (x2apic) {
+		return rdmsr(0x800 + (reg >> 2));
+	}
 #ifdef ES_ARCH_X86_64
 	return acpi.lapicAddress[reg];
 #else
@@ -90,6 +112,10 @@ uint32_t LapicReadRegister(uint32_t reg) {
 }
 
 void LapicWriteRegister(uint32_t reg, uint32_t value) {
+	if (x2apic) {
+		wrmsr(0x800 + (reg >> 2), value);
+		return;
+	}
 #ifdef ES_ARCH_X86_64
 	acpi.lapicAddress[reg] = value;
 #else
@@ -97,6 +123,16 @@ void LapicWriteRegister(uint32_t reg, uint32_t value) {
 #endif
 }
 
+static void write_icr(uint32_t apic_id, uint32_t low) {
+	if (x2apic) {
+		wrmsr(0x830, (((uint64_t)apic_id) << 32) | low);
+		return;
+	}
+
+	LapicWriteRegister(0x310 >> 2, apic_id << 24);
+	LapicWriteRegister(0x300 >> 2, low);
+}
+
 void LapicNextTimer(size_t ms) {
 	LapicWriteRegister(0x320 >> 2, TIMER_INTERRUPT | (1 << 17)); 
 	LapicWriteRegister(0x380 >> 2, acpi.lapicTicksPerMs * ms); 
@@ -640,6 +676,22 @@ NewProcessorStorage AllocateNewProcessorStorage(ArchCPU *archCPU) {
 }
 
 void SetupProcessor2(NewProcessorStorage *storage) {
+	// Enable the APIC!
+	// TODO Check it is actually present!
+	// on AMD64, we know that the APIC will be present.
+	wrmsr(0x1b, rdmsr(0x1b) | 0x800 | (x2apic ? (1 << 10) : 0));
+
+	// Set the spurious interrupt vector to 0xFF
+	LapicWriteRegister(0xF0 >> 2, LapicReadRegister(0xF0 >> 2) | 0x1ff);
+
+	// Use the flat processor addressing model
+	if (!x2apic) {
+		LapicWriteRegister(0xE0 >> 2, 0xFFFFFFFF);
+	}
+
+	// Make sure that no external interrupts are masked
+	ProcessorEnableInterrupts();
+
 	// Setup the local interrupts for the current processor.
 		
 	for (uintptr_t i = 0; i < acpi.lapicNMICount; i++) {
@@ -682,7 +734,9 @@ void SetupProcessor2(NewProcessorStorage *storage) {
 void ArchInitialise() {
 	ACPIParseTables();
 
-	uint8_t bootstrapLapicID = (LapicReadRegister(0x20 >> 2) >> 24); 
+	x2apic = !!(rdmsr(0x1b) & (1 << 10));
+
+	uint8_t bootstrapLapicID = x2apic ? LapicReadRegister(0x20 >> 2) : (LapicReadRegister(0x20 >> 2) >> 24);
 
 	ArchCPU *currentCPU = nullptr;
 
@@ -695,6 +749,12 @@ void ArchInitialise() {
 		}
 	}
 
+	if (x2apic) {
+		EsPrint("Using x2apic, boot CPU id %d (apicid 0x%x)\n", currentCPU, bootstrapLapicID);
+	} else {
+		EsPrint("Using xapic, boot CPU id %d (apicid 0x%x)\n", currentCPU, bootstrapLapicID);
+	}
+
 	if (!currentCPU) {
 		KernelPanic("ArchInitialise - Could not find the bootstrap processor\n");
 	}
@@ -743,10 +803,8 @@ size_t ProcessorSendIPI(uintptr_t interrupt, bool nmi, int processorID) {
 			}
 		}
 
-		uint32_t destination = acpi.processors[i].apicID << 24;
 		uint32_t command = interrupt | (1 << 14) | (nmi ? 0x400 : 0);
-		LapicWriteRegister(0x310 >> 2, destination);
-		LapicWriteRegister(0x300 >> 2, command); 
+		write_icr(acpi.processors[i].apicID, command); 
 
 		// Wait for the interrupt to be sent.
 		while (LapicReadRegister(0x300 >> 2) & (1 << 12));
@@ -1049,15 +1107,13 @@ void ArchStartupApplicationProcessors() {
 
 		// Send an INIT IPI.
 		ProcessorDisableInterrupts(); // Don't be interrupted between writes...
-		LapicWriteRegister(0x310 >> 2, processor->apicID << 24);
-		LapicWriteRegister(0x300 >> 2, 0x4500);
+		write_icr(processor->apicID, 0x4500);
 		ProcessorEnableInterrupts();
 		KEventWait(&delay, 10);
 
 		// Send a startup IPI.
 		ProcessorDisableInterrupts();
-		LapicWriteRegister(0x310 >> 2, processor->apicID << 24);
-		LapicWriteRegister(0x300 >> 2, 0x4600 | (AP_TRAMPOLINE >> K_PAGE_BITS));
+		write_icr(processor->apicID, 0x4600 | (AP_TRAMPOLINE >> K_PAGE_BITS));
 		ProcessorEnableInterrupts();
 		for (uintptr_t i = 0; i < 100 && *startupFlag == 0; i++) KEventWait(&delay, 1);
 
@@ -1066,8 +1122,7 @@ void ArchStartupApplicationProcessors() {
 		} else {
 			// Send a startup IPI, again.
 			ProcessorDisableInterrupts();
-			LapicWriteRegister(0x310 >> 2, processor->apicID << 24);
-			LapicWriteRegister(0x300 >> 2, 0x4600 | (AP_TRAMPOLINE >> K_PAGE_BITS));
+			write_icr(processor->apicID, 0x4600 | (AP_TRAMPOLINE >> K_PAGE_BITS));
 			ProcessorEnableInterrupts();
 			for (uintptr_t i = 0; i < 1000 && *startupFlag == 0; i++) KEventWait(&delay, 1); // Wait longer this time.
 

From 026b18e6314879a07fa585f7f861827e4892668d Mon Sep 17 00:00:00 2001
From: Vladimir Serbinenko <phcoder@gmail.com>
Date: Mon, 24 Feb 2025 17:58:14 +0300
Subject: [PATCH 2/2] Don't assume that BSP has lapicid 0

On Meteor LAke it has ID 0x20 and results in missing interrupts
---
 arch/x86_pc.cpp | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/arch/x86_pc.cpp b/arch/x86_pc.cpp
index 0cf4cda..bd489f7 100644
--- a/arch/x86_pc.cpp
+++ b/arch/x86_pc.cpp
@@ -42,6 +42,7 @@ uint32_t bootloaderID;
 uintptr_t bootloaderInformationOffset;
 
 bool x2apic = false;
+uint32_t bootstrapLapicID;
 
 // Spinlock since some drivers need to access it in IRQs (e.g. ACPICA).
 KSpinlock pciConfigSpinlock; 
@@ -736,7 +737,7 @@ void ArchInitialise() {
 
 	x2apic = !!(rdmsr(0x1b) & (1 << 10));
 
-	uint8_t bootstrapLapicID = x2apic ? LapicReadRegister(0x20 >> 2) : (LapicReadRegister(0x20 >> 2) >> 24);
+	bootstrapLapicID = x2apic ? LapicReadRegister(0x20 >> 2) : (LapicReadRegister(0x20 >> 2) >> 24);
 
 	ArchCPU *currentCPU = nullptr;
 
@@ -1003,7 +1004,7 @@ KMSIInformation KRegisterMSI(KIRQHandler handler, void *context, const char *cOw
 				INTERRUPT_VECTOR_MSI_START + i, cOwnerName);
 
 		return {
-			.address = 0xFEE00000,
+			.address = 0xFEE00000 | (bootstrapLapicID << 12),
 			.data = INTERRUPT_VECTOR_MSI_START + i,
 			.tag = i,
 		};