mirror of
https://github.com/phil-opp/blog_os.git
synced 2025-12-16 22:37:49 +00:00
Update posts to use x86_64 crate
This commit is contained in:
@@ -898,18 +898,15 @@ An x86 processor has many different caches because always accessing the main mem
|
|||||||
|
|
||||||
The translation lookaside buffer, or TLB, caches the translation of virtual to physical addresses. It's filled automatically when a page is accessed. But it's not updated transparently when the mapping of a page changes. This is the reason that we still can access the page even through we unmapped it in the page table.
|
The translation lookaside buffer, or TLB, caches the translation of virtual to physical addresses. It's filled automatically when a page is accessed. But it's not updated transparently when the mapping of a page changes. This is the reason that we still can access the page even through we unmapped it in the page table.
|
||||||
|
|
||||||
So to fix our `unmap` function, we need to remove the cached translation from the TLB. We can use Gerd Zellweger's [x86][x86 crate] crate to do this easily. To add it, we append the following to our `Cargo.toml`:
|
So to fix our `unmap` function, we need to remove the cached translation from the TLB. We can use the [x86_64][x86_64 crate] crate to do this easily. To add it, we append the following to our `Cargo.toml`:
|
||||||
|
|
||||||
[x86 crate]: https://github.com/gz/rust-x86
|
[x86_64 crate]: https://docs.rs/x86_64
|
||||||
|
|
||||||
```toml
|
```toml
|
||||||
[dependencies.x86]
|
[dependencies]
|
||||||
version = "0.8.0"
|
...
|
||||||
default-features = false
|
x86_64 = "0.1.0"
|
||||||
```
|
```
|
||||||
It has a `performance-counter` feature that allows reading the CPU specific [performance counters] but increases compile times. We don't need it right now, so we disable it using `default-features = false`.
|
|
||||||
|
|
||||||
[performance counters]: http://gz.github.io/rust-x86/x86/perfcnt/index.html
|
|
||||||
|
|
||||||
Now we can use it to fix `unmap`:
|
Now we can use it to fix `unmap`:
|
||||||
|
|
||||||
@@ -917,7 +914,9 @@ It has a `performance-counter` feature that allows reading the CPU specific [per
|
|||||||
...
|
...
|
||||||
p1[page.p1_index()].set_unused();
|
p1[page.p1_index()].set_unused();
|
||||||
unsafe {
|
unsafe {
|
||||||
::x86::shared::tlb::flush(page.start_address());
|
use x86_64::instructions::tlb;
|
||||||
|
use x86_64::VirtualAddress;
|
||||||
|
tlb::flush(VirtualAddress(page.start_address()));
|
||||||
}
|
}
|
||||||
// TODO free p(1,2,3) table if empty
|
// TODO free p(1,2,3) table if empty
|
||||||
//allocator.deallocate_frame(frame);
|
//allocator.deallocate_frame(frame);
|
||||||
|
|||||||
@@ -345,12 +345,11 @@ pub fn with<F>(&mut self,
|
|||||||
f: F)
|
f: F)
|
||||||
where F: FnOnce(&mut ActivePageTable)
|
where F: FnOnce(&mut ActivePageTable)
|
||||||
{
|
{
|
||||||
use x86::shared::tlb;
|
use x86_64::instructions::tlb;
|
||||||
let flush_tlb = || unsafe { tlb::flush_all() };
|
|
||||||
|
|
||||||
// overwrite recursive mapping
|
// overwrite recursive mapping
|
||||||
self.p4_mut()[511].set(table.p4_frame.clone(), PRESENT | WRITABLE);
|
self.p4_mut()[511].set(table.p4_frame.clone(), PRESENT | WRITABLE);
|
||||||
flush_tlb();
|
tlb::flush_all();
|
||||||
|
|
||||||
// execute f in the new context
|
// execute f in the new context
|
||||||
f(self);
|
f(self);
|
||||||
@@ -449,7 +448,7 @@ Right now, the `with` function overwrites the recursive mapping and calls the cl
|
|||||||
To backup the physical P4 frame of the active table, we can either read it from the 511th P4 entry (before we change it) or from the CR3 control register directly. We will do the latter as it should be faster and we already have a external crate that makes it easy:
|
To backup the physical P4 frame of the active table, we can either read it from the 511th P4 entry (before we change it) or from the CR3 control register directly. We will do the latter as it should be faster and we already have a external crate that makes it easy:
|
||||||
|
|
||||||
```rust
|
```rust
|
||||||
use x86::shared::control_regs;
|
use x86_64::shared::control_regs;
|
||||||
let backup = Frame::containing_address(
|
let backup = Frame::containing_address(
|
||||||
unsafe { control_regs::cr3() } as usize
|
unsafe { control_regs::cr3() } as usize
|
||||||
);
|
);
|
||||||
@@ -482,8 +481,8 @@ pub fn with<F>(&mut self,
|
|||||||
f: F)
|
f: F)
|
||||||
where F: FnOnce(&mut Mapper)
|
where F: FnOnce(&mut Mapper)
|
||||||
{
|
{
|
||||||
use x86::shared::{control_regs, tlb};
|
use x86_64::instructions::tlb;
|
||||||
let flush_tlb = || unsafe { tlb::flush_all() };
|
use x86_64::shared::{control_regs, tlb};
|
||||||
|
|
||||||
{
|
{
|
||||||
let backup = Frame::containing_address(
|
let backup = Frame::containing_address(
|
||||||
@@ -494,14 +493,14 @@ pub fn with<F>(&mut self,
|
|||||||
|
|
||||||
// overwrite recursive mapping
|
// overwrite recursive mapping
|
||||||
self.p4_mut()[511].set(table.p4_frame.clone(), PRESENT | WRITABLE);
|
self.p4_mut()[511].set(table.p4_frame.clone(), PRESENT | WRITABLE);
|
||||||
flush_tlb();
|
tlb::flush_all();
|
||||||
|
|
||||||
// execute f in the new context
|
// execute f in the new context
|
||||||
f(self);
|
f(self);
|
||||||
|
|
||||||
// restore recursive mapping to original p4 table
|
// restore recursive mapping to original p4 table
|
||||||
p4_table[511].set(backup, PRESENT | WRITABLE);
|
p4_table[511].set(backup, PRESENT | WRITABLE);
|
||||||
flush_tlb();
|
tlb::flush_all();
|
||||||
}
|
}
|
||||||
|
|
||||||
temporary_page.unmap(self);
|
temporary_page.unmap(self);
|
||||||
@@ -755,7 +754,7 @@ We do this in a new `ActivePageTable::switch` method:
|
|||||||
// in `impl ActivePageTable` in src/memory/paging/mod.rs
|
// in `impl ActivePageTable` in src/memory/paging/mod.rs
|
||||||
|
|
||||||
pub fn switch(&mut self, new_table: InactivePageTable) -> InactivePageTable {
|
pub fn switch(&mut self, new_table: InactivePageTable) -> InactivePageTable {
|
||||||
use x86::shared::control_regs;
|
use x86_64::shared::control_regs;
|
||||||
|
|
||||||
let old_table = InactivePageTable {
|
let old_table = InactivePageTable {
|
||||||
p4_frame: Frame::containing_address(
|
p4_frame: Frame::containing_address(
|
||||||
@@ -976,7 +975,7 @@ So we need to enable the `NXE` bit. For that we use the awesome [x86][rust-x86]
|
|||||||
// in lib.rs
|
// in lib.rs
|
||||||
|
|
||||||
fn enable_nxe_bit() {
|
fn enable_nxe_bit() {
|
||||||
use x86::shared::msr::{IA32_EFER, rdmsr, wrmsr};
|
use x86_64::shared::msr::{IA32_EFER, rdmsr, wrmsr};
|
||||||
|
|
||||||
let nxe_bit = 1 << 11;
|
let nxe_bit = 1 << 11;
|
||||||
unsafe {
|
unsafe {
|
||||||
@@ -996,7 +995,7 @@ Right now, we are still able to modify the `.code` and `.rodata` sections, even
|
|||||||
// in lib.rs
|
// in lib.rs
|
||||||
|
|
||||||
fn enable_write_protect_bit() {
|
fn enable_write_protect_bit() {
|
||||||
use x86::shared::control_regs::{cr0, cr0_write, CR0_WRITE_PROTECT};
|
use x86_64::shared::control_regs::{cr0, cr0_write, CR0_WRITE_PROTECT};
|
||||||
|
|
||||||
unsafe { cr0_write(cr0() | CR0_WRITE_PROTECT) };
|
unsafe { cr0_write(cr0() | CR0_WRITE_PROTECT) };
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -84,8 +84,9 @@ Now we create types for the IDT and its entries:
|
|||||||
```rust
|
```rust
|
||||||
// src/interrupts/idt.rs
|
// src/interrupts/idt.rs
|
||||||
|
|
||||||
use x86::shared::segmentation::{self, SegmentSelector};
|
use x86_64::instructions::segmentation;
|
||||||
use x86::shared::PrivilegeLevel;
|
use x86_64::structures::gdt::SegmentSelector;
|
||||||
|
use x86_64::PrivilegeLevel;
|
||||||
|
|
||||||
pub struct Idt([Entry; 16]);
|
pub struct Idt([Entry; 16]);
|
||||||
|
|
||||||
@@ -279,10 +280,9 @@ impl Idt {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
```
|
```
|
||||||
The method overwrites the specified entry with the given handler function. We use the `segmentation::cs`[^fn-segmentation-cs] function of the [x86 crate] to get the current code segment descriptor. There's no need for different kernel code segments in long mode, so the current `cs` value should be always the right choice.
|
The method overwrites the specified entry with the given handler function. We use the `segmentation::cs` function of the [x86_64 crate] to get the current code segment descriptor. There's no need for different kernel code segments in long mode, so the current `cs` value should be always the right choice.
|
||||||
|
|
||||||
[x86 crate]: https://github.com/gz/rust-x86
|
[x86_64 crate]: https://docs.rs/x86_64
|
||||||
[^fn-segmentation-cs]: The `segmentation::cs` function was [added](https://github.com/gz/rust-x86/pull/12) in version 0.7.0, so you might need to update your `x86` version in your `Cargo.toml`.
|
|
||||||
|
|
||||||
By returning a mutual reference to the entry's options, we allow the caller to override the default settings. For example, the caller could add a non-present entry by executing: `idt.set_handler(11, handler_fn).set_present(false)`.
|
By returning a mutual reference to the entry's options, we allow the caller to override the default settings. For example, the caller could add a non-present entry by executing: `idt.set_handler(11, handler_fn).set_present(false)`.
|
||||||
|
|
||||||
@@ -299,19 +299,19 @@ Type | Name | Description
|
|||||||
u16 | Limit | The maximum addressable byte in the table. Equal to the table size in bytes minus 1.
|
u16 | Limit | The maximum addressable byte in the table. Equal to the table size in bytes minus 1.
|
||||||
u64 | Offset | Virtual start address of the table.
|
u64 | Offset | Virtual start address of the table.
|
||||||
|
|
||||||
This structure is already contained [in the x86 crate], so we don't need to create it ourselves. The same is true for the [lidt function]. So we just need to put the pieces together to create a `load` method:
|
This structure is already contained [in the x86_64 crate], so we don't need to create it ourselves. The same is true for the [lidt function]. So we just need to put the pieces together to create a `load` method:
|
||||||
|
|
||||||
[in the x86 crate]: http://gz.github.io/rust-x86/x86/dtables/struct.DescriptorTablePointer.html
|
[in the x86_64 crate]: http://docs.rs/x86_64/0.1.0/x86_64/instructions/tables/struct.DescriptorTablePointer.html
|
||||||
[lidt function]: http://gz.github.io/rust-x86/x86/dtables/fn.lidt.html
|
[lidt function]: http://docs.rs/x86_64/0.1.0/x86_64/instructions/tables/fn.lidt.html
|
||||||
|
|
||||||
```rust
|
```rust
|
||||||
impl Idt {
|
impl Idt {
|
||||||
pub fn load(&self) {
|
pub fn load(&self) {
|
||||||
use x86::shared::dtables::{DescriptorTablePointer, lidt};
|
use x86_64::instructions::tables::{DescriptorTablePointer, lidt};
|
||||||
use core::mem::size_of;
|
use core::mem::size_of;
|
||||||
|
|
||||||
let ptr = DescriptorTablePointer {
|
let ptr = DescriptorTablePointer {
|
||||||
base: self as *const _ as *const ::x86::bits64::irq::IdtEntry,
|
base: self as *const _ as u64,
|
||||||
limit: (size_of::<Self>() - 1) as u16,
|
limit: (size_of::<Self>() - 1) as u16,
|
||||||
};
|
};
|
||||||
|
|
||||||
@@ -319,9 +319,7 @@ impl Idt {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
```
|
```
|
||||||
The method does not need to modify the IDT, so it takes `self` by immutable reference. First, we create a `DescriptorTablePointer` and then we pass it to `lidt`. The `lidt` function expects that the `base` field has the type `x86::bits64::irq::IdtEntry`[^fn-x86-idt-entry], therefore we need to cast the `self` pointer. For calculating the `limit` we use [mem::size_of]. The additional `-1` is needed because the limit field has to be the maximum addressable byte (inclusive bound). We need an unsafe block around `lidt`, because the function assumes that the specified handler addresses are valid.
|
The method does not need to modify the IDT, so it takes `self` by immutable reference. First, we create a `DescriptorTablePointer` and then we pass it to `lidt`. The `lidt` function expects that the `base` field has the type `u64`, therefore we need to cast the `self` pointer. For calculating the `limit` we use [mem::size_of]. The additional `-1` is needed because the limit field has to be the maximum addressable byte (inclusive bound). We need an unsafe block around `lidt`, because the function assumes that the specified handler addresses are valid.
|
||||||
|
|
||||||
[^fn-x86-idt-entry]: The `x86` crate has its own `IdtEntry` type, but it is a bit incomplete. Therefore we created our own IDT types.
|
|
||||||
|
|
||||||
[mem::size_of]: https://doc.rust-lang.org/nightly/core/mem/fn.size_of.html
|
[mem::size_of]: https://doc.rust-lang.org/nightly/core/mem/fn.size_of.html
|
||||||
|
|
||||||
|
|||||||
@@ -148,7 +148,7 @@ If you want to try it, insert it in `src/lib.rs` and call it from `rust_main`. W
|
|||||||
[...]
|
[...]
|
||||||
000000000010df90 <_ZN7blog_os22naked_function_example17ha9f733dfe42b595dE>:
|
000000000010df90 <_ZN7blog_os22naked_function_example17ha9f733dfe42b595dE>:
|
||||||
10df90: 48 c7 c0 2a 00 00 00 mov $0x42,%rax
|
10df90: 48 c7 c0 2a 00 00 00 mov $0x42,%rax
|
||||||
10df97: c3 retq
|
10df97: c3 retq
|
||||||
10df98: 0f 1f 84 00 00 00 00 nopl 0x0(%rax,%rax,1)
|
10df98: 0f 1f 84 00 00 00 00 nopl 0x0(%rax,%rax,1)
|
||||||
10df9f: 00
|
10df9f: 00
|
||||||
```
|
```
|
||||||
@@ -629,7 +629,7 @@ Now we can improve our page fault error message by using the new `PageFaultError
|
|||||||
extern "C" fn page_fault_handler(stack_frame: &ExceptionStackFrame,
|
extern "C" fn page_fault_handler(stack_frame: &ExceptionStackFrame,
|
||||||
error_code: u64) -> !
|
error_code: u64) -> !
|
||||||
{
|
{
|
||||||
use x86::shared::control_regs;
|
use x86_64::registers::control_regs;
|
||||||
println!(
|
println!(
|
||||||
"\nEXCEPTION: PAGE FAULT while accessing {:#x}\
|
"\nEXCEPTION: PAGE FAULT while accessing {:#x}\
|
||||||
\nerror code: {:?}\n{:#?}",
|
\nerror code: {:?}\n{:#?}",
|
||||||
|
|||||||
@@ -79,7 +79,7 @@ In order to test it, we insert an `int3` instruction in our `rust_main`:
|
|||||||
// in src/lib.rs
|
// in src/lib.rs
|
||||||
...
|
...
|
||||||
#[macro_use] // needed for the `int!` macro
|
#[macro_use] // needed for the `int!` macro
|
||||||
extern crate x86;
|
extern crate x86_64;
|
||||||
...
|
...
|
||||||
|
|
||||||
#[no_mangle]
|
#[no_mangle]
|
||||||
|
|||||||
@@ -41,10 +41,9 @@ pub extern "C" fn rust_main(multiboot_information_address: usize) {
|
|||||||
}
|
}
|
||||||
{{< / highlight >}}
|
{{< / highlight >}}
|
||||||
|
|
||||||
We use the [int! macro] of the [x86 crate] to trigger the exception with vector number `1`, which is the [debug exception]. The debug exception occurs for example when a breakpoint defined in the [debug registers] is hit. Like the [breakpoint exception], it is mainly used for [implementing debuggers].
|
We use the [int! macro] of the `x86_64` crate to trigger the exception with vector number `1`, which is the [debug exception]. The debug exception occurs for example when a breakpoint defined in the [debug registers] is hit. Like the [breakpoint exception], it is mainly used for [implementing debuggers].
|
||||||
|
|
||||||
[int! macro]: https://docs.rs/x86/0.8.0/x86/macro.int!.html
|
[int! macro]: https://docs.rs/x86_64/0.1.0/x86_64/macro.int!.html
|
||||||
[x86 crate]: https://github.com/gz/rust-x86
|
|
||||||
[debug exception]: http://wiki.osdev.org/Exceptions#Debug
|
[debug exception]: http://wiki.osdev.org/Exceptions#Debug
|
||||||
[debug registers]: https://en.wikipedia.org/wiki/X86_debug_register
|
[debug registers]: https://en.wikipedia.org/wiki/X86_debug_register
|
||||||
[breakpoint exception]: http://wiki.osdev.org/Exceptions#Breakpoint
|
[breakpoint exception]: http://wiki.osdev.org/Exceptions#Breakpoint
|
||||||
@@ -476,7 +475,7 @@ Let's create a new TSS that contains our double fault stack in its interrupt sta
|
|||||||
```rust
|
```rust
|
||||||
// in src/interrupts/mod.rs
|
// in src/interrupts/mod.rs
|
||||||
|
|
||||||
use x86::bits64::task::TaskStateSegment;
|
use x86_64::structures::tss::TaskStateSegment;
|
||||||
```
|
```
|
||||||
|
|
||||||
Let's create a new TSS in our `interrupts::init` function:
|
Let's create a new TSS in our `interrupts::init` function:
|
||||||
@@ -624,7 +623,7 @@ Let's add a function to our descriptor that creates a TSS descriptor for a given
|
|||||||
```rust
|
```rust
|
||||||
// in src/interrupts/gdt.rs
|
// in src/interrupts/gdt.rs
|
||||||
|
|
||||||
use x86::bits64::task::TaskStateSegment;
|
use x86_64::structures::tss::TaskStateSegment;
|
||||||
|
|
||||||
impl Descriptor {
|
impl Descriptor {
|
||||||
pub fn tss_segment(tss: &'static TaskStateSegment) -> Descriptor {
|
pub fn tss_segment(tss: &'static TaskStateSegment) -> Descriptor {
|
||||||
@@ -660,8 +659,8 @@ In order to add descriptors to the GDT, we add a `add_entry` method:
|
|||||||
```rust
|
```rust
|
||||||
// in src/interrupts/gdt.rs
|
// in src/interrupts/gdt.rs
|
||||||
|
|
||||||
use x86::shared::segmentation::SegmentSelector;
|
use x86_64::structures::gdt::SegmentSelector;
|
||||||
use x86::shared::PrivilegeLevel;
|
use x86_64::PrivilegeLevel;
|
||||||
|
|
||||||
impl Gdt {
|
impl Gdt {
|
||||||
pub fn add_entry(&mut self, entry: Descriptor) -> SegmentSelector {
|
pub fn add_entry(&mut self, entry: Descriptor) -> SegmentSelector {
|
||||||
@@ -709,8 +708,8 @@ To load the GDT, we add a new `load` method:
|
|||||||
|
|
||||||
impl Gdt {
|
impl Gdt {
|
||||||
pub fn load(&'static self) {
|
pub fn load(&'static self) {
|
||||||
use x86::shared::dtables::{DescriptorTablePointer, lgdt};
|
use x86_64::instructions::tables::{DescriptorTablePointer, lgdt};
|
||||||
use x86::shared::segmentation;
|
use x86_64::instructions::segmentation;
|
||||||
use core::mem::size_of;
|
use core::mem::size_of;
|
||||||
|
|
||||||
let ptr = DescriptorTablePointer {
|
let ptr = DescriptorTablePointer {
|
||||||
@@ -847,8 +846,9 @@ For the first two steps, we need access to the `code_selector` and `tss_selector
|
|||||||
{{< highlight rust "hl_lines=3 4 7 8 11 12 19 21" >}}
|
{{< highlight rust "hl_lines=3 4 7 8 11 12 19 21" >}}
|
||||||
// in src/interrupts/mod.rs
|
// in src/interrupts/mod.rs
|
||||||
pub fn init(memory_controller: &mut MemoryController) {
|
pub fn init(memory_controller: &mut MemoryController) {
|
||||||
use x86::shared::segmentation::{SegmentSelector, set_cs};
|
use x86_64::structures::gdt::SegmentSelector;
|
||||||
use x86::shared::task::load_tr;
|
use x86_64::instructions::segmentation::set_cs;
|
||||||
|
use x86_64::instructions::tables::load_tss;
|
||||||
...
|
...
|
||||||
|
|
||||||
let mut code_selector = SegmentSelector::empty();
|
let mut code_selector = SegmentSelector::empty();
|
||||||
@@ -865,17 +865,17 @@ pub fn init(memory_controller: &mut MemoryController) {
|
|||||||
// reload code segment register
|
// reload code segment register
|
||||||
set_cs(code_selector);
|
set_cs(code_selector);
|
||||||
// load TSS
|
// load TSS
|
||||||
load_tr(tss_selector);
|
load_tss(tss_selector);
|
||||||
}
|
}
|
||||||
|
|
||||||
IDT.load();
|
IDT.load();
|
||||||
}
|
}
|
||||||
{{< / highlight >}}
|
{{< / highlight >}}
|
||||||
|
|
||||||
We first set the descriptors to `empty` and then update them from inside the closure (which implicitly borrows them as `&mut`). Now we're able to reload the code segment register using [`set_cs`] and to load the TSS using [`load_tr`].
|
We first set the descriptors to `empty` and then update them from inside the closure (which implicitly borrows them as `&mut`). Now we're able to reload the code segment register using [`set_cs`] and to load the TSS using [`load_tss`].
|
||||||
|
|
||||||
[`set_cs`]: https://docs.rs/x86/0.8.0/x86/shared/segmentation/fn.set_cs.html
|
[`set_cs`]: https://docs.rs/x86/0.8.0/x86/shared/segmentation/fn.set_cs.html
|
||||||
[`load_tr`]: https://docs.rs/x86/0.8.0/x86/shared/task/fn.load_tr.html
|
[`load_tss`]: https://docs.rs/x86/0.8.0/x86/shared/task/fn.load_tss.html
|
||||||
|
|
||||||
Now that we loaded a valid TSS and interrupt stack table, we can set the stack index for our double fault handler in the IDT:
|
Now that we loaded a valid TSS and interrupt stack table, we can set the stack index for our double fault handler in the IDT:
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user