Project

General

Profile

Statistics
| Revision:

root / lab4 / .minix-src / include / i386 / pte.h @ 14

History | View | Annotate | Download (11.1 KB)

1 13 up20180614
/*        $NetBSD: pte.h,v 1.27 2011/02/01 20:09:08 chuck Exp $        */
2
3
/*
4
 * Copyright (c) 2001 Wasabi Systems, Inc.
5
 * All rights reserved.
6
 *
7
 * Written by Frank van der Linden for Wasabi Systems, Inc.
8
 *
9
 * Redistribution and use in source and binary forms, with or without
10
 * modification, are permitted provided that the following conditions
11
 * are met:
12
 * 1. Redistributions of source code must retain the above copyright
13
 *    notice, this list of conditions and the following disclaimer.
14
 * 2. Redistributions in binary form must reproduce the above copyright
15
 *    notice, this list of conditions and the following disclaimer in the
16
 *    documentation and/or other materials provided with the distribution.
17
 * 3. All advertising materials mentioning features or use of this software
18
 *    must display the following acknowledgement:
19
 *      This product includes software developed for the NetBSD Project by
20
 *      Wasabi Systems, Inc.
21
 * 4. The name of Wasabi Systems, Inc. may not be used to endorse
22
 *    or promote products derived from this software without specific prior
23
 *    written permission.
24
 *
25
 * THIS SOFTWARE IS PROVIDED BY WASABI SYSTEMS, INC. ``AS IS'' AND
26
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
27
 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
28
 * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL WASABI SYSTEMS, INC
29
 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
30
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
31
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
32
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
33
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
34
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
35
 * POSSIBILITY OF SUCH DAMAGE.
36
 */
37
38
/*
39
 * Copyright (c) 1997 Charles D. Cranor and Washington University.
40
 * All rights reserved.
41
 *
42
 * Redistribution and use in source and binary forms, with or without
43
 * modification, are permitted provided that the following conditions
44
 * are met:
45
 * 1. Redistributions of source code must retain the above copyright
46
 *    notice, this list of conditions and the following disclaimer.
47
 * 2. Redistributions in binary form must reproduce the above copyright
48
 *    notice, this list of conditions and the following disclaimer in the
49
 *    documentation and/or other materials provided with the distribution.
50
 *
51
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
52
 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
53
 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
54
 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
55
 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
56
 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
57
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
58
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
59
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
60
 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
61
 */
62
63
/*
64
 * pte.h rewritten by chuck based on the jolitz version, plus random
65
 * info on the pentium and other processors found on the net.   the
66
 * goal of this rewrite is to provide enough documentation on the MMU
67
 * hardware that the reader will be able to understand it without having
68
 * to refer to a hardware manual.
69
 */
70
71
#ifndef _I386_PTE_H_
72
#define _I386_PTE_H_
73
#ifdef _KERNEL_OPT
74
#include "opt_xen.h"
75
#endif
76
77
/*
78
 * i386 MMU hardware structure (without PAE extension):
79
 *
80
 * the i386 MMU is a two-level MMU which maps 4GB of virtual memory.
81
 * the pagesize is 4K (4096 [0x1000] bytes), although newer pentium
82
 * processors can support a 4MB pagesize as well.
83
 *
84
 * the first level table (segment table?) is called a "page directory"
85
 * and it contains 1024 page directory entries (PDEs).   each PDE is
86
 * 4 bytes (an int), so a PD fits in a single 4K page.   this page is
87
 * the page directory page (PDP).  each PDE in a PDP maps 4MB of space
88
 * (1024 * 4MB = 4GB).   a PDE contains the physical address of the
89
 * second level table: the page table.   or, if 4MB pages are being used,
90
 * then the PDE contains the PA of the 4MB page being mapped.
91
 *
92
 * a page table consists of 1024 page table entries (PTEs).  each PTE is
93
 * 4 bytes (an int), so a page table also fits in a single 4K page.  a
94
 * 4K page being used as a page table is called a page table page (PTP).
95
 * each PTE in a PTP maps one 4K page (1024 * 4K = 4MB).   a PTE contains
96
 * the physical address of the page it maps and some flag bits (described
97
 * below).
98
 *
99
 * the processor has a special register, "cr3", which points to the
100
 * the PDP which is currently controlling the mappings of the virtual
101
 * address space.
102
 *
103
 * the following picture shows the translation process for a 4K page:
104
 *
105
 * %cr3 register [PA of PDP]
106
 *      |
107
 *      |
108
 *      |   bits <31-22> of VA         bits <21-12> of VA   bits <11-0>
109
 *      |   index the PDP (0 - 1023)   index the PTP        are the page offset
110
 *      |         |                           |                  |
111
 *      |         v                           |                  |
112
 *      +--->+----------+                     |                  |
113
 *           | PD Page  |   PA of             v                  |
114
 *           |          |---PTP-------->+------------+           |
115
 *           | 1024 PDE |               | page table |--PTE--+   |
116
 *           | entries  |               | (aka PTP)  |       |   |
117
 *           +----------+               | 1024 PTE   |       |   |
118
 *                                      | entries    |       |   |
119
 *                                      +------------+       |   |
120
 *                                                           |   |
121
 *                                                bits <31-12>   bits <11-0>
122
 *                                                p h y s i c a l  a d d r
123
 *
124
 * the i386 caches PTEs in a TLB.   it is important to flush out old
125
 * TLB mappings when making a change to a mappings.   writing to the
126
 * %cr3 will flush the entire TLB.    newer processors also have an
127
 * instruction that will invalidate the mapping of a single page (which
128
 * is useful if you are changing a single mappings because it preserves
129
 * all the cached TLB entries).
130
 *
131
 * as shows, bits 31-12 of the PTE contain PA of the page being mapped.
132
 * the rest of the PTE is defined as follows:
133
 *   bit#        name        use
134
 *   11                n/a        available for OS use, hardware ignores it
135
 *   10                n/a        available for OS use, hardware ignores it
136
 *   9                n/a        available for OS use, hardware ignores it
137
 *   8                G        global bit (see discussion below)
138
 *   7                PS        page size [for PDEs] (0=4k, 1=4M <if supported>)
139
 *   6                D        dirty (modified) page
140
 *   5                A        accessed (referenced) page
141
 *   4                PCD        cache disable
142
 *   3                PWT        prevent write through (cache)
143
 *   2                U/S        user/supervisor bit (0=supervisor only, 1=both u&s)
144
 *   1                R/W        read/write bit (0=read only, 1=read-write)
145
 *   0                P        present (valid)
146
 *
147
 * notes:
148
 *  - PS is only supported on newer processors
149
 *  - PTEs with the G bit are global in the sense that they are not
150
 *    flushed from the TLB when %cr3 is written (to flush, use the
151
 *    "flush single page" instruction).   this is only supported on
152
 *    newer processors.    this bit can be used to keep the kernel's
153
 *    TLB entries around while context switching.   since the kernel
154
 *    is mapped into all processes at the same place it does not make
155
 *    sense to flush these entries when switching from one process'
156
 *    pmap to another.
157
 *
158
 * The PAE extension extends the size of the PTE to 64 bits (52bits physical
159
 * address) and is compatible with the amd64 PTE format. The first level
160
 * maps 2M, the second 1G, so a third level page table is introduced to
161
 * map the 4GB virtual address space. This PD has only 4 entries.
162
 * We can't use recursive mapping at level 3 to map the PD pages, as this
163
 * would eat one GB of address space. In addition, Xen imposes restrictions
164
 * on the entries we put in the L3 page (for example, the page pointed to by
165
 * the last slot can't be shared among different L3 pages), which makes
166
 * handling this L3 page in the same way we do for L2 on i386 (or L4 on amd64)
167
 * difficult. For most things we'll just pretend to have only 2 levels,
168
 * with the 2 high bits of the L2 index being in fact the index in the
169
 * L3.
170
 */
171
172
#if !defined(_LOCORE)
173
174
/*
175
 * here we define the data types for PDEs and PTEs
176
 */
177
#ifdef PAE
178
typedef uint64_t pd_entry_t;                /* PDE */
179
typedef uint64_t pt_entry_t;                /* PTE */
180
#else
181
typedef uint32_t pd_entry_t;                /* PDE */
182
typedef uint32_t pt_entry_t;                /* PTE */
183
#endif
184
185
#endif
186
187
/*
188
 * now we define various for playing with virtual addresses
189
 */
190
191
#ifdef PAE
192
#define        L1_SHIFT        12
193
#define        L2_SHIFT        21
194
#define        L3_SHIFT        30
195
#define        NBPD_L1                (1ULL << L1_SHIFT) /* # bytes mapped by L1 ent (4K) */
196
#define        NBPD_L2                (1ULL << L2_SHIFT) /* # bytes mapped by L2 ent (2MB) */
197
#define        NBPD_L3                (1ULL << L3_SHIFT) /* # bytes mapped by L3 ent (1GB) */
198
199
#define        L3_MASK                0xc0000000
200
#define        L2_REALMASK        0x3fe00000
201
#define        L2_MASK                (L2_REALMASK | L3_MASK)
202
#define        L1_MASK                0x001ff000
203
204
#define        L3_FRAME        (L3_MASK)
205
#define        L2_FRAME        (L3_FRAME | L2_MASK)
206
#define        L1_FRAME        (L2_FRAME|L1_MASK)
207
208
#define        PG_FRAME        0x000ffffffffff000ULL /* page frame mask */
209
#define        PG_LGFRAME        0x000fffffffe00000ULL /* large (2MB) page frame mask */
210
211
/* macros to get real L2 and L3 index, from our "extended" L2 index */
212
#define l2tol3(idx)        ((idx) >> (L3_SHIFT - L2_SHIFT))
213
#define l2tol2(idx)        ((idx) & (L2_REALMASK >>  L2_SHIFT))
214
215
#else /* PAE */
216
217
#define        L1_SHIFT        12
218
#define        L2_SHIFT        22
219
#define        NBPD_L1                (1UL << L1_SHIFT) /* # bytes mapped by L1 ent (4K) */
220
#define        NBPD_L2                (1UL << L2_SHIFT) /* # bytes mapped by L2 ent (4MB) */
221
222
#define L2_MASK                0xffc00000
223
#define L1_MASK                0x003ff000
224
225
#define L2_FRAME        (L2_MASK)
226
#define L1_FRAME        (L2_FRAME|L1_MASK)
227
228
#define        PG_FRAME        0xfffff000        /* page frame mask */
229
#define        PG_LGFRAME        0xffc00000        /* large (4MB) page frame mask */
230
231
#endif /* PAE */
232
/*
233
 * here we define the bits of the PDE/PTE, as described above:
234
 *
235
 * XXXCDC: need to rename these (PG_u == ugly).
236
 */
237
238
#define        PG_V                0x00000001        /* valid entry */
239
#define        PG_RO                0x00000000        /* read-only page */
240
#define        PG_RW                0x00000002        /* read-write page */
241
#define        PG_u                0x00000004        /* user accessible page */
242
#define        PG_PROT                0x00000806        /* all protection bits */
243
#define PG_WT                0x00000008        /* write through */
244
#define        PG_N                0x00000010        /* non-cacheable */
245
#define        PG_U                0x00000020        /* has been used */
246
#define        PG_M                0x00000040        /* has been modified */
247
#define PG_PAT                0x00000080        /* PAT (on pte) */
248
#define PG_PS                0x00000080        /* 4MB page size (2MB for PAE) */
249
#define PG_G                0x00000100        /* global, don't TLB flush */
250
#define PG_AVAIL1        0x00000200        /* ignored by hardware */
251
#define PG_AVAIL2        0x00000400        /* ignored by hardware */
252
#define PG_AVAIL3        0x00000800        /* ignored by hardware */
253
#define PG_LGPAT        0x00001000        /* PAT on large pages */
254
255
/*
256
 * various short-hand protection codes
257
 */
258
259
#define        PG_KR                0x00000000        /* kernel read-only */
260
#define        PG_KW                0x00000002        /* kernel read-write */
261
262
#ifdef PAE
263
#define        PG_NX                0x8000000000000000ULL /* No-execute */
264
#else
265
#define        PG_NX                0                /* dummy */
266
#endif
267
268
#include <x86/pte.h>
269
270
#endif /* _I386_PTE_H_ */