This source file includes the following definitions:
- oom
- free_one_table
- clear_page_tables
- free_page_tables
- clone_page_tables
- copy_page_tables
- unmap_page_range
- zeromap_page_range
- remap_page_range
- put_page
- put_dirty_page
- do_wp_page
- verify_area
- get_empty_page
- try_to_share
- share_page
- get_empty_pgtable
- do_swap_page
- do_no_page
- do_page_fault
- __bad_pagetable
- __bad_page
- __zero_page
- show_mem
- paging_init
- mem_init
- si_meminfo
- file_mmap_nopage

/*
 *  linux/mm/memory.c
 *
 *  Copyright (C) 1991, 1992  Linus Torvalds
 */

#include <asm/system.h>
#include <linux/config.h>

#include <linux/signal.h>
#include <linux/sched.h>
#include <linux/head.h>
#include <linux/kernel.h>
#include <linux/errno.h>
#include <linux/string.h>
#include <linux/types.h>
#include <linux/ptrace.h>
#include <linux/mman.h>
#include <linux/segment.h>
#include <asm/segment.h>

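/*
 * Defining CONFIG_TEST_VERIFY_AREA forces wp_works_ok to 0 in mem_init(),
 * so that the manual write-check path in verify_area() gets exercised
 * even on processors that honour the WP bit.
 */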
#undef CONFIG_TEST_VERIFY_AREA

unsigned long high_memory = 0;

extern unsigned long pg0[1024];

extern void sound_mem_init(void);
extern void die_if_kernel(char *,struct pt_regs *,long);
extern void show_net_buffers(void);

int nr_swap_pages = 0;
int nr_free_pages = 0;
struct mem_list free_area_list[NR_MEM_LISTS];
unsigned char * free_area_map[NR_MEM_LISTS];

#define copy_page(from,to) \
__asm__("cld ; rep ; movsl": :"S" (from),"D" (to),"c" (1024):"cx","di","si")

unsigned short * mem_map = NULL;

#define CODE_SPACE(addr,p) ((addr) < (p)->end_code)

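/*
 * oom() prints a message (so that the user knows why the process died)
 * and then gives the process an untreatable SIGKILL: the handler is
 * reset and the signal unblocked so it can neither be caught nor ignored.
 */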
void oom(struct task_struct * task)
{
	printk("\nOut of memory.\n");
	task->sigaction[SIGKILL-1].sa_handler = NULL;
	task->blocked &= ~(1<<(SIGKILL-1));
	send_sig(SIGKILL,task,1);
}

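/*
 * Free one page-table page and every page or swap entry it maps, after
 * sanity-checking the page-directory entry. Reserved (kernel) page
 * tables are left alone.
 */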
static void free_one_table(unsigned long * page_dir)
{
	int j;
	unsigned long pg_table = *page_dir;
	unsigned long * page_table;

	if (!pg_table)
		return;
	*page_dir = 0;
	if (pg_table >= high_memory || !(pg_table & PAGE_PRESENT)) {
		printk("Bad page table: [%p]=%08lx\n",page_dir,pg_table);
		return;
	}
	if (mem_map[MAP_NR(pg_table)] & MAP_PAGE_RESERVED)
		return;
	page_table = (unsigned long *) (pg_table & PAGE_MASK);
	for (j = 0 ; j < PTRS_PER_PAGE ; j++,page_table++) {
		unsigned long pg = *page_table;

		if (!pg)
			continue;
		*page_table = 0;
		if (pg & PAGE_PRESENT)
			free_page(PAGE_MASK & pg);
		else
			swap_free(pg);
	}
	free_page(PAGE_MASK & pg_table);
}

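/*
 * This function clears all user-level page tables of a process - this
 * is needed by exec(), so that old pages aren't in the way. Unlike
 * free_page_tables(), it leaves a valid page-directory in place: the
 * kernel entries (slot 768 and up) are kept, only the user area is
 * cleared. If the directory is shared, a private copy is made first.
 */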
void clear_page_tables(struct task_struct * tsk)
{
	int i;
	unsigned long pg_dir;
	unsigned long * page_dir;

	if (!tsk)
		return;
	if (tsk == task[0])
		panic("task[0] (swapper) doesn't support exec()\n");
	pg_dir = tsk->tss.cr3;
	page_dir = (unsigned long *) pg_dir;
	if (!page_dir || page_dir == swapper_pg_dir) {
		printk("Trying to clear kernel page-directory: not good\n");
		return;
	}
	if (mem_map[MAP_NR(pg_dir)] > 1) {
		unsigned long * new_pg;

		if (!(new_pg = (unsigned long*) get_free_page(GFP_KERNEL))) {
			oom(tsk);
			return;
		}
		for (i = 768 ; i < 1024 ; i++)
			new_pg[i] = page_dir[i];
		free_page(pg_dir);
		tsk->tss.cr3 = (unsigned long) new_pg;
		return;
	}
	for (i = 0 ; i < 768 ; i++,page_dir++)
		free_one_table(page_dir);
	invalidate();
	return;
}

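/*
 * This function frees up all page tables of a process when it exits.
 * The task is switched to the kernel page-directory first (reloading
 * %cr3 if it is the current task); a shared directory is just released,
 * otherwise every table is freed.
 */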
void free_page_tables(struct task_struct * tsk)
{
	int i;
	unsigned long pg_dir;
	unsigned long * page_dir;

	if (!tsk)
		return;
	if (tsk == task[0]) {
		printk("task[0] (swapper) killed: unable to recover\n");
		panic("Trying to free up swapper memory space");
	}
	pg_dir = tsk->tss.cr3;
	if (!pg_dir || pg_dir == (unsigned long) swapper_pg_dir) {
		printk("Trying to free kernel page-directory: not good\n");
		return;
	}
	tsk->tss.cr3 = (unsigned long) swapper_pg_dir;
	if (tsk == current)
		__asm__ __volatile__("movl %0,%%cr3": :"a" (tsk->tss.cr3));
	if (mem_map[MAP_NR(pg_dir)] > 1) {
		free_page(pg_dir);
		return;
	}
	page_dir = (unsigned long *) pg_dir;
	for (i = 0 ; i < PTRS_PER_PAGE ; i++,page_dir++)
		free_one_table(page_dir);
	free_page(pg_dir);
	invalidate();
}

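/*
 * clone_page_tables() clones the page tables for a process - both
 * processes share the same page directory, and with it the exact same
 * memory: changes made by one are seen by the other.
 */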
int clone_page_tables(struct task_struct * tsk)
{
	unsigned long pg_dir;

	pg_dir = current->tss.cr3;
	mem_map[MAP_NR(pg_dir)]++;
	tsk->tss.cr3 = pg_dir;
	return 0;
}

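/*
 * copy_page_tables() copies the whole process memory range, making all
 * writable pages copy-on-write in both processes. Note the special
 * handling of RESERVED (ie kernel) pages, which are always shared.
 */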
int copy_page_tables(struct task_struct * tsk)
{
	int i;
	unsigned long old_pg_dir, *old_page_dir;
	unsigned long new_pg_dir, *new_page_dir;

	if (!(new_pg_dir = get_free_page(GFP_KERNEL)))
		return -ENOMEM;
	old_pg_dir = current->tss.cr3;
	tsk->tss.cr3 = new_pg_dir;
	old_page_dir = (unsigned long *) old_pg_dir;
	new_page_dir = (unsigned long *) new_pg_dir;
	for (i = 0 ; i < PTRS_PER_PAGE ; i++,old_page_dir++,new_page_dir++) {
		int j;
		unsigned long old_pg_table, *old_page_table;
		unsigned long new_pg_table, *new_page_table;

		old_pg_table = *old_page_dir;
		if (!old_pg_table)
			continue;
		if (old_pg_table >= high_memory || !(old_pg_table & PAGE_PRESENT)) {
			printk("copy_page_tables: bad page table: "
				"probable memory corruption\n");
			*old_page_dir = 0;
			continue;
		}
		if (mem_map[MAP_NR(old_pg_table)] & MAP_PAGE_RESERVED) {
			*new_page_dir = old_pg_table;
			continue;
		}
		if (!(new_pg_table = get_free_page(GFP_KERNEL))) {
			free_page_tables(tsk);
			return -ENOMEM;
		}
		old_page_table = (unsigned long *) (PAGE_MASK & old_pg_table);
		new_page_table = (unsigned long *) (PAGE_MASK & new_pg_table);
		for (j = 0 ; j < PTRS_PER_PAGE ; j++,old_page_table++,new_page_table++) {
			unsigned long pg;
			pg = *old_page_table;
			if (!pg)
				continue;
			if (!(pg & PAGE_PRESENT)) {
				*new_page_table = swap_duplicate(pg);
				continue;
			}
			if (pg > high_memory || (mem_map[MAP_NR(pg)] & MAP_PAGE_RESERVED)) {
				*new_page_table = pg;
				continue;
			}
			if (pg & PAGE_COW)
				pg &= ~PAGE_RW;
			if (in_swap_cache(pg)) {
				swap_cache_invalidate(pg);
				pg |= PAGE_DIRTY;
			}
			*new_page_table = pg;
			*old_page_table = pg;
			mem_map[MAP_NR(pg)]++;
		}
		*new_page_dir = new_pg_table | PAGE_TABLE;
	}
	invalidate();
	return 0;
}

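/*
 * unmap_page_range() unmaps a page-aligned range of memory: every page
 * and swap entry in the range is released, and any page table that is
 * completely covered by the range is freed as well.
 */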
int unmap_page_range(unsigned long from, unsigned long size)
{
	unsigned long page, page_dir;
	unsigned long *page_table, *dir;
	unsigned long poff, pcnt, pc;

	if (from & ~PAGE_MASK) {
		printk("unmap_page_range called with wrong alignment\n");
		return -EINVAL;
	}
	size = (size + ~PAGE_MASK) >> PAGE_SHIFT;
	dir = PAGE_DIR_OFFSET(current->tss.cr3,from);
	poff = (from >> PAGE_SHIFT) & (PTRS_PER_PAGE-1);
	if ((pcnt = PTRS_PER_PAGE - poff) > size)
		pcnt = size;

	for ( ; size > 0; ++dir, size -= pcnt,
	     pcnt = (size > PTRS_PER_PAGE ? PTRS_PER_PAGE : size)) {
		if (!(page_dir = *dir)) {
			poff = 0;
			continue;
		}
		if (!(page_dir & PAGE_PRESENT)) {
			printk("unmap_page_range: bad page directory.");
			continue;
		}
		page_table = (unsigned long *)(PAGE_MASK & page_dir);
		if (poff) {
			page_table += poff;
			poff = 0;
		}
		for (pc = pcnt; pc--; page_table++) {
			if ((page = *page_table) != 0) {
				*page_table = 0;
				if (1 & page) {
					if (!(mem_map[MAP_NR(page)] & MAP_PAGE_RESERVED))
						if (current->mm->rss > 0)
							--current->mm->rss;
					free_page(PAGE_MASK & page);
				} else
					swap_free(page);
			}
		}
		if (pcnt == PTRS_PER_PAGE) {
			*dir = 0;
			free_page(PAGE_MASK & page_dir);
		}
	}
	invalidate();
	return 0;
}

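/*
 * zeromap_page_range() maps the given range to the global zero page
 * with the given protection bits, freeing whatever was mapped there
 * before. With a zero mask the range is simply cleared.
 */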
int zeromap_page_range(unsigned long from, unsigned long size, int mask)
{
	unsigned long *page_table, *dir;
	unsigned long poff, pcnt;
	unsigned long page;

	if (mask) {
		if ((mask & (PAGE_MASK|PAGE_PRESENT)) != PAGE_PRESENT) {
			printk("zeromap_page_range: mask = %08x\n",mask);
			return -EINVAL;
		}
		mask |= ZERO_PAGE;
	}
	if (from & ~PAGE_MASK) {
		printk("zeromap_page_range: from = %08lx\n",from);
		return -EINVAL;
	}
	dir = PAGE_DIR_OFFSET(current->tss.cr3,from);
	size = (size + ~PAGE_MASK) >> PAGE_SHIFT;
	poff = (from >> PAGE_SHIFT) & (PTRS_PER_PAGE-1);
	if ((pcnt = PTRS_PER_PAGE - poff) > size)
		pcnt = size;

	while (size > 0) {
		if (!(PAGE_PRESENT & *dir)) {
			if (!(page_table = (unsigned long*) get_free_page(GFP_KERNEL))) {
				invalidate();
				return -ENOMEM;
			}
			if (PAGE_PRESENT & *dir) {
				free_page((unsigned long) page_table);
				page_table = (unsigned long *)(PAGE_MASK & *dir++);
			} else
				*dir++ = ((unsigned long) page_table) | PAGE_TABLE;
		} else
			page_table = (unsigned long *)(PAGE_MASK & *dir++);
		page_table += poff;
		poff = 0;
		for (size -= pcnt; pcnt-- ;) {
			if ((page = *page_table) != 0) {
				*page_table = 0;
				if (page & PAGE_PRESENT) {
					if (!(mem_map[MAP_NR(page)] & MAP_PAGE_RESERVED))
						if (current->mm->rss > 0)
							--current->mm->rss;
					free_page(PAGE_MASK & page);
				} else
					swap_free(page);
			}
			*page_table++ = mask;
		}
		pcnt = (size > PTRS_PER_PAGE ? PTRS_PER_PAGE : size);
	}
	invalidate();
	return 0;
}

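/*
 * remap_page_range() maps a range of physical memory into the requested
 * pages. The old mappings are removed. Any references to nonexistent
 * pages result in null mappings (currently treated as "copy-on-access").
 */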
int remap_page_range(unsigned long from, unsigned long to, unsigned long size, int mask)
{
	unsigned long *page_table, *dir;
	unsigned long poff, pcnt;
	unsigned long page;

	if (mask) {
		if ((mask & (PAGE_MASK|PAGE_PRESENT)) != PAGE_PRESENT) {
			printk("remap_page_range: mask = %08x\n",mask);
			return -EINVAL;
		}
	}
	if ((from & ~PAGE_MASK) || (to & ~PAGE_MASK)) {
		printk("remap_page_range: from = %08lx, to=%08lx\n",from,to);
		return -EINVAL;
	}
	dir = PAGE_DIR_OFFSET(current->tss.cr3,from);
	size = (size + ~PAGE_MASK) >> PAGE_SHIFT;
	poff = (from >> PAGE_SHIFT) & (PTRS_PER_PAGE-1);
	if ((pcnt = PTRS_PER_PAGE - poff) > size)
		pcnt = size;

	while (size > 0) {
		if (!(PAGE_PRESENT & *dir)) {
			if (!(page_table = (unsigned long*) get_free_page(GFP_KERNEL))) {
				invalidate();
				return -1;
			}
			*dir++ = ((unsigned long) page_table) | PAGE_TABLE;
		} else
			page_table = (unsigned long *)(PAGE_MASK & *dir++);
		if (poff) {
			page_table += poff;
			poff = 0;
		}

		for (size -= pcnt; pcnt-- ;) {
			if ((page = *page_table) != 0) {
				*page_table = 0;
				if (PAGE_PRESENT & page) {
					if (!(mem_map[MAP_NR(page)] & MAP_PAGE_RESERVED))
						if (current->mm->rss > 0)
							--current->mm->rss;
					free_page(PAGE_MASK & page);
				} else
					swap_free(page);
			}

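			/*
			 * A zero mask clears the entry; targets above
			 * high_memory (device memory) are mapped as-is;
			 * nonexistent pages get a null mapping; normal
			 * RAM pages are mapped and their use counts bumped.
			 */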
			if (!mask)
				*page_table++ = 0;
			else if (to >= high_memory)
				*page_table++ = (to | mask);
			else if (!mem_map[MAP_NR(to)])
				*page_table++ = 0;
			else {
				*page_table++ = (to | mask);
				if (!(mem_map[MAP_NR(to)] & MAP_PAGE_RESERVED)) {
					++current->mm->rss;
					mem_map[MAP_NR(to)]++;
				}
			}
			to += PAGE_SIZE;
		}
		pcnt = (size > PTRS_PER_PAGE ? PTRS_PER_PAGE : size);
	}
	invalidate();
	return 0;
}

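/*
 * This function puts a page in memory at the wanted address.
 * It returns the physical address of the page gotten, 0 if
 * out of memory (either when trying to access the page-table or
 * the page itself).
 */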
unsigned long put_page(struct task_struct * tsk,unsigned long page,
	unsigned long address,int prot)
{
	unsigned long *page_table;

	if ((prot & (PAGE_MASK|PAGE_PRESENT)) != PAGE_PRESENT)
		printk("put_page: prot = %08x\n",prot);
	if (page >= high_memory) {
		printk("put_page: trying to put page %08lx at %08lx\n",page,address);
		return 0;
	}
	page_table = PAGE_DIR_OFFSET(tsk->tss.cr3,address);
	if ((*page_table) & PAGE_PRESENT)
		page_table = (unsigned long *) (PAGE_MASK & *page_table);
	else {
		printk("put_page: bad page directory entry\n");
		oom(tsk);
		*page_table = BAD_PAGETABLE | PAGE_TABLE;
		return 0;
	}
	page_table += (address >> PAGE_SHIFT) & (PTRS_PER_PAGE-1);
	if (*page_table) {
		printk("put_page: page already exists\n");
		*page_table = 0;
		invalidate();
	}
	*page_table = page | prot;
	return page;
}

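/*
 * The previous function doesn't work very well if you also want to mark
 * the page dirty: exec.c wants this, as it has earlier changed the page,
 * and we want the dirty-status to be correct (for VM). Thus the same
 * routine, but this time we mark it dirty too.
 */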
unsigned long put_dirty_page(struct task_struct * tsk, unsigned long page, unsigned long address)
{
	unsigned long tmp, *page_table;

	if (page >= high_memory)
		printk("put_dirty_page: trying to put page %08lx at %08lx\n",page,address);
	if (mem_map[MAP_NR(page)] != 1)
		printk("mem_map disagrees with %08lx at %08lx\n",page,address);
	page_table = PAGE_DIR_OFFSET(tsk->tss.cr3,address);
	if (PAGE_PRESENT & *page_table)
		page_table = (unsigned long *) (PAGE_MASK & *page_table);
	else {
		if (!(tmp = get_free_page(GFP_KERNEL)))
			return 0;
		if (PAGE_PRESENT & *page_table) {
			free_page(tmp);
			page_table = (unsigned long *) (PAGE_MASK & *page_table);
		} else {
			*page_table = tmp | PAGE_TABLE;
			page_table = (unsigned long *) tmp;
		}
	}
	page_table += (address >> PAGE_SHIFT) & (PTRS_PER_PAGE-1);
	if (*page_table) {
		printk("put_dirty_page: page already exists\n");
		*page_table = 0;
		invalidate();
	}
	*page_table = page | (PAGE_DIRTY | PAGE_PRIVATE);
	return page;
}

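/*
 * This routine handles present pages, when users try to write to a
 * shared page. If the page is still shared we allocate a fresh page,
 * copy the contents and map the copy writable, decrementing the
 * shared-page counter for the old page; if we are the sole user the
 * page is simply made writable in place.
 */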
void do_wp_page(struct vm_area_struct * vma, unsigned long address,
	unsigned long error_code)
{
	unsigned long *pde, pte, old_page, prot;
	unsigned long new_page;

	new_page = __get_free_page(GFP_KERNEL);
	pde = PAGE_DIR_OFFSET(vma->vm_task->tss.cr3,address);
	pte = *pde;
	if (!(pte & PAGE_PRESENT))
		goto end_wp_page;
	if ((pte & PAGE_TABLE) != PAGE_TABLE || pte >= high_memory)
		goto bad_wp_pagetable;
	pte &= PAGE_MASK;
	pte += PAGE_PTR(address);
	old_page = *(unsigned long *) pte;
	if (!(old_page & PAGE_PRESENT))
		goto end_wp_page;
	if (old_page >= high_memory)
		goto bad_wp_page;
	if (old_page & PAGE_RW)
		goto end_wp_page;
	vma->vm_task->mm->min_flt++;
	prot = (old_page & ~PAGE_MASK) | PAGE_RW;
	old_page &= PAGE_MASK;
	if (mem_map[MAP_NR(old_page)] != 1) {
		if (new_page) {
			if (mem_map[MAP_NR(old_page)] & MAP_PAGE_RESERVED)
				++vma->vm_task->mm->rss;
			copy_page(old_page,new_page);
			*(unsigned long *) pte = new_page | prot;
			free_page(old_page);
			invalidate();
			return;
		}
		free_page(old_page);
		oom(vma->vm_task);
		*(unsigned long *) pte = BAD_PAGE | prot;
		invalidate();
		return;
	}
	*(unsigned long *) pte |= PAGE_RW;
	invalidate();
	if (new_page)
		free_page(new_page);
	return;
bad_wp_page:
	printk("do_wp_page: bogus page at address %08lx (%08lx)\n",address,old_page);
	*(unsigned long *) pte = BAD_PAGE | PAGE_SHARED;
	send_sig(SIGKILL, vma->vm_task, 1);
	goto end_wp_page;
bad_wp_pagetable:
	printk("do_wp_page: bogus page-table at address %08lx (%08lx)\n",address,pte);
	*pde = BAD_PAGETABLE | PAGE_TABLE;
	send_sig(SIGKILL, vma->vm_task, 1);
end_wp_page:
	if (new_page)
		free_page(new_page);
	return;
}

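/*
 * verify_area() checks that a userspace memory range may be read or
 * written. On processors whose WP bit is not honoured in supervisor
 * mode, writes have to be checked page by page, simulating the
 * copy-on-write faults by hand via do_wp_page().
 */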
int verify_area(int type, const void * addr, unsigned long size)
{
	struct vm_area_struct * vma;
	unsigned long start = (unsigned long) addr;

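	/*
	 * If the current user space is mapped to kernel space (for the
	 * case where we use a fake user buffer with get_fs/set_fs()) we
	 * don't expect to find the address in the user vm map.
	 */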
	if (get_fs() == get_ds())
		return 0;

	for (vma = current->mm->mmap ; ; vma = vma->vm_next) {
		if (!vma)
			goto bad_area;
		if (vma->vm_end > start)
			break;
	}
	if (vma->vm_start <= start)
		goto good_area;
	if (!(vma->vm_flags & VM_GROWSDOWN))
		goto bad_area;
	if (vma->vm_end - start > current->rlim[RLIMIT_STACK].rlim_cur)
		goto bad_area;

good_area:
	if (!wp_works_ok && type == VERIFY_WRITE)
		goto check_wp_fault_by_hand;
	for (;;) {
		struct vm_area_struct * next;
		if (type != VERIFY_READ && !(vma->vm_page_prot & (PAGE_COW | PAGE_RW)))
			goto bad_area;
		if (vma->vm_end - start >= size)
			return 0;
		next = vma->vm_next;
		if (!next || vma->vm_end != next->vm_start)
			goto bad_area;
		vma = next;
	}

check_wp_fault_by_hand:
	size--;
	size += start & ~PAGE_MASK;
	size >>= PAGE_SHIFT;
	start &= PAGE_MASK;

	for (;;) {
		if (!(vma->vm_page_prot & (PAGE_COW | PAGE_RW)))
			goto bad_area;
		do_wp_page(vma, start, PAGE_PRESENT);
		if (!size)
			return 0;
		size--;
		start += PAGE_SIZE;
		if (start < vma->vm_end)
			continue;
		vma = vma->vm_next;
		if (!vma || vma->vm_start != start)
			break;
	}

bad_area:
	return -EFAULT;
}

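/*
 * get_empty_page() fills a page-table entry at the given address with a
 * fresh page (or BAD_PAGE if we are out of memory).
 */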
static inline void get_empty_page(struct task_struct * tsk, unsigned long address)
{
	unsigned long tmp;

	if (!(tmp = get_free_page(GFP_KERNEL))) {
		oom(tsk);
		tmp = BAD_PAGE;
	}
	if (!put_page(tsk,tmp,address,PAGE_PRIVATE))
		free_page(tmp);
}

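/*
 * try_to_share() checks the page at "from_address" in "from_area", to
 * see if it exists and is clean. If so, share it with "to_area" at
 * "to_address": with a nonzero "newpage" the contents are copied
 * instead of shared, as an early copy-on-write.
 *
 * NOTE! This assumes the two tasks are different, map the same inode
 * and can otherwise share (the caller, share_page(), has checked this).
 */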
static int try_to_share(unsigned long to_address, struct vm_area_struct * to_area,
	unsigned long from_address, struct vm_area_struct * from_area,
	unsigned long newpage)
{
	unsigned long from;
	unsigned long to;
	unsigned long from_page;
	unsigned long to_page;

	from_page = (unsigned long)PAGE_DIR_OFFSET(from_area->vm_task->tss.cr3,from_address);
	to_page = (unsigned long)PAGE_DIR_OFFSET(to_area->vm_task->tss.cr3,to_address);

	from = *(unsigned long *) from_page;
	if (!(from & PAGE_PRESENT))
		return 0;
	from &= PAGE_MASK;
	from_page = from + PAGE_PTR(from_address);
	from = *(unsigned long *) from_page;
	if (!(from & PAGE_PRESENT))
		return 0;
	if ((from_area->vm_page_prot & PAGE_COW) && (from & PAGE_DIRTY))
		return 0;
	if (from >= high_memory)
		return 0;
	if (mem_map[MAP_NR(from)] & MAP_PAGE_RESERVED)
		return 0;

	to = *(unsigned long *) to_page;
	if (!(to & PAGE_PRESENT))
		return 0;
	to &= PAGE_MASK;
	to_page = to + PAGE_PTR(to_address);
	if (*(unsigned long *) to_page)
		return 0;

	if (newpage) {
		if (in_swap_cache(from)) {
			if (from_area->vm_page_prot & PAGE_COW)
				return 0;
		}
		copy_page((from & PAGE_MASK), newpage);
		*(unsigned long *) to_page = newpage | to_area->vm_page_prot;
		return 1;
	}

	if (in_swap_cache(from)) {
		if (from_area->vm_page_prot & PAGE_COW)
			return 0;
		from |= PAGE_DIRTY;
		*(unsigned long *) from_page = from;
		swap_cache_invalidate(from);
		invalidate();
	}
	mem_map[MAP_NR(from)]++;

	to = (from & (PAGE_MASK | PAGE_DIRTY)) | to_area->vm_page_prot;
	if (to & PAGE_COW)
		to &= ~PAGE_RW;
	*(unsigned long *) to_page = to;

	if (!(from & PAGE_RW))
		return 1;
	if (!(from_area->vm_page_prot & PAGE_COW))
		return 1;

	from &= ~PAGE_RW;
	*(unsigned long *) from_page = from;
	invalidate();
	return 1;
}

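/*
 * share_page() tries to find a process that could share a page with
 * the current one.
 *
 * We first check if it is at all feasible by checking inode->i_count.
 * It should be >1 if there are other tasks sharing this inode.
 */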
static int share_page(struct vm_area_struct * area, unsigned long address,
	unsigned long error_code, unsigned long newpage)
{
	struct inode * inode;
	struct task_struct ** p;
	unsigned long offset;
	unsigned long from_address;
	unsigned long give_page;

	if (!area || !(inode = area->vm_inode) || inode->i_count < 2)
		return 0;

	give_page = 0;
	if ((area->vm_page_prot & PAGE_COW) && (error_code & PAGE_RW)) {
		if (!newpage)
			return 0;
		give_page = newpage;
	}
	offset = address - area->vm_start + area->vm_offset;
	for (p = &LAST_TASK ; p > &FIRST_TASK ; --p) {
		struct vm_area_struct * mpnt;
		if (!*p)
			continue;
		if (area->vm_task == *p)
			continue;
		for (mpnt = (*p)->mm->mmap; mpnt; mpnt = mpnt->vm_next) {
			if (mpnt->vm_inode != inode)
				continue;
			if ((mpnt->vm_offset ^ area->vm_offset) & ~PAGE_MASK)
				continue;
			from_address = offset + mpnt->vm_start - mpnt->vm_offset;
			if (from_address < mpnt->vm_start || from_address >= mpnt->vm_end)
				continue;
			if (!try_to_share(address, area, from_address, mpnt, give_page))
				continue;
			if (give_page || !newpage)
				return 1;
			free_page(newpage);
			return 1;
		}
	}
	return 0;
}

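/*
 * Make sure a page-table entry exists for the given address: return the
 * existing page-directory entry if present, or allocate a fresh page
 * table (re-checking for races around the blocking allocation).
 */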
static inline unsigned long get_empty_pgtable(struct task_struct * tsk,unsigned long address)
{
	unsigned long page;
	unsigned long *p;

	p = PAGE_DIR_OFFSET(tsk->tss.cr3,address);
	if (PAGE_PRESENT & *p)
		return *p;
	if (*p) {
		printk("get_empty_pgtable: bad page-directory entry \n");
		*p = 0;
	}
	page = get_free_page(GFP_KERNEL);
	p = PAGE_DIR_OFFSET(tsk->tss.cr3,address);
	if (PAGE_PRESENT & *p) {
		free_page(page);
		return *p;
	}
	if (*p) {
		printk("get_empty_pgtable: bad page-directory entry \n");
		*p = 0;
	}
	if (page) {
		*p = page | PAGE_TABLE;
		return *p;
	}
	oom(current);
	*p = BAD_PAGETABLE | PAGE_TABLE;
	return 0;
}

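/*
 * Swap a page back in, either through the area's swapin() operation or
 * the generic swap_in(). The page-table entry is re-checked afterwards,
 * since swapping in may have blocked and another fault may have beaten
 * us to it.
 */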
static inline void do_swap_page(struct vm_area_struct * vma,
	unsigned long address, unsigned long * pge, unsigned long entry)
{
	unsigned long page;

	if (vma->vm_ops && vma->vm_ops->swapin)
		page = vma->vm_ops->swapin(vma, entry);
	else
		page = swap_in(entry);
	if (*pge != entry) {
		free_page(page);
		return;
	}
	page = page | vma->vm_page_prot;
	if (mem_map[MAP_NR(page)] > 1 && (page & PAGE_COW))
		page &= ~PAGE_RW;
	++vma->vm_task->mm->rss;
	++vma->vm_task->mm->maj_flt;
	*pge = page;
	return;
}

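/*
 * do_no_page() handles faults on not-present pages: swapped-out pages
 * are brought back in, anonymous pages get a fresh page, and mappings
 * with a nopage() operation are paged in from their backing file, first
 * trying to share the page with another process mapping the same inode.
 */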
void do_no_page(struct vm_area_struct * vma, unsigned long address,
	unsigned long error_code)
{
	unsigned long page, entry, prot;

	page = get_empty_pgtable(vma->vm_task,address);
	if (!page)
		return;
	page &= PAGE_MASK;
	page += PAGE_PTR(address);
	entry = *(unsigned long *) page;
	if (entry & PAGE_PRESENT)
		return;
	if (entry) {
		do_swap_page(vma, address, (unsigned long *) page, entry);
		return;
	}
	address &= PAGE_MASK;

	if (!vma->vm_ops || !vma->vm_ops->nopage) {
		++vma->vm_task->mm->rss;
		++vma->vm_task->mm->min_flt;
		get_empty_page(vma->vm_task,address);
		return;
	}
	page = get_free_page(GFP_KERNEL);
	if (share_page(vma, address, error_code, page)) {
		++vma->vm_task->mm->min_flt;
		++vma->vm_task->mm->rss;
		return;
	}
	if (!page) {
		oom(current);
		put_page(vma->vm_task, BAD_PAGE, address, PAGE_PRIVATE);
		return;
	}
	++vma->vm_task->mm->maj_flt;
	++vma->vm_task->mm->rss;
	prot = vma->vm_page_prot;

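	/*
	 * The last argument is "no_share": a write to a copy-on-write
	 * area must get a private copy of the page rather than one that
	 * might be shared with other processes.
	 */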
	page = vma->vm_ops->nopage(vma, address, page, (error_code & PAGE_RW) && (prot & PAGE_COW));
	if (share_page(vma, address, error_code, 0)) {
		free_page(page);
		return;
	}

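	/*
	 * On a write the page is mapped dirty right away; a read of a
	 * copy-on-write page that is already shared has to be mapped
	 * read-only.
	 */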
	if (error_code & PAGE_RW) {
		prot |= PAGE_DIRTY;
	} else if ((prot & PAGE_COW) && mem_map[MAP_NR(page)] > 1)
		prot &= ~PAGE_RW;
	if (put_page(vma->vm_task, page, address, prot))
		return;
	free_page(page);
	oom(current);
}

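/*
 * This routine handles page faults. It determines the address and the
 * problem, and then passes it off to one of the appropriate routines:
 * do_wp_page() for write-protect faults on present pages, do_no_page()
 * for everything else.
 */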
asmlinkage void do_page_fault(struct pt_regs *regs, unsigned long error_code)
{
	struct vm_area_struct * vma;
	unsigned long address;
	unsigned long page;

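	/* get the faulting linear address from %cr2 */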
	__asm__("movl %%cr2,%0":"=r" (address));
	for (vma = current->mm->mmap ; ; vma = vma->vm_next) {
		if (!vma)
			goto bad_area;
		if (vma->vm_end > address)
			break;
	}
	if (vma->vm_start <= address)
		goto good_area;
	if (!(vma->vm_flags & VM_GROWSDOWN))
		goto bad_area;
	if (vma->vm_end - address > current->rlim[RLIMIT_STACK].rlim_cur)
		goto bad_area;
	vma->vm_offset -= vma->vm_start - (address & PAGE_MASK);
	vma->vm_start = (address & PAGE_MASK);

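/*
 * Ok, we have a good vm_area for this memory access, so
 * we can handle it..
 */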
good_area:
	if (regs->eflags & VM_MASK) {
		unsigned long bit = (address - 0xA0000) >> PAGE_SHIFT;
		if (bit < 32)
			current->screen_bitmap |= 1 << bit;
	}
	if (error_code & PAGE_PRESENT) {
		if ((vma->vm_page_prot & (PAGE_RW | PAGE_COW | PAGE_PRESENT)) == PAGE_PRESENT)
			goto bad_area;
#ifdef CONFIG_TEST_VERIFY_AREA
		if (regs->cs == KERNEL_CS)
			printk("WP fault at %08x\n", regs->eip);
#endif
		do_wp_page(vma, address, error_code);
		return;
	}
	if (!(vma->vm_page_prot & PAGE_PRESENT))
		goto bad_area;
	do_no_page(vma, address, error_code);
	return;

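/*
 * Something tried to access memory that isn't in our memory map..
 * Fix it, but check if it's kernel or user first..
 */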
bad_area:
	if (error_code & PAGE_USER) {
		current->tss.cr2 = address;
		current->tss.error_code = error_code;
		current->tss.trap_no = 14;
		send_sig(SIGSEGV, current, 1);
		return;
	}

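/*
 * Oops. The kernel tried to access some bad page. Unless this was the
 * deliberate write to page 0 that tests the WP bit in mem_init(), we'll
 * have to terminate things with extreme prejudice.
 */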
	if (wp_works_ok < 0 && address == TASK_SIZE && (error_code & PAGE_PRESENT)) {
		wp_works_ok = 1;
		pg0[0] = PAGE_SHARED;
		printk("This processor honours the WP bit even when in supervisor mode. Good.\n");
		return;
	}
	if ((unsigned long) (address-TASK_SIZE) < PAGE_SIZE) {
		printk(KERN_ALERT "Unable to handle kernel NULL pointer dereference");
		pg0[0] = PAGE_SHARED;
	} else
		printk(KERN_ALERT "Unable to handle kernel paging request");
	printk(" at virtual address %08lx\n",address);
	__asm__("movl %%cr3,%0" : "=r" (page));
	printk(KERN_ALERT "current->tss.cr3 = %08lx, %%cr3 = %08lx\n",
		current->tss.cr3, page);
	page = ((unsigned long *) page)[address >> 22];
	printk(KERN_ALERT "*pde = %08lx\n", page);
	if (page & PAGE_PRESENT) {
		page &= PAGE_MASK;
		address &= 0x003ff000;
		page = ((unsigned long *) page)[address >> PAGE_SHIFT];
		printk(KERN_ALERT "*pte = %08lx\n", page);
	}
	die_if_kernel("Oops", regs, error_code);
	do_exit(SIGKILL);
}

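/*
 * BAD_PAGE is the page that is used for page faults when linux
 * is out-of-memory. Older versions of linux just did a
 * do_exit(), but using this instead means there is less risk
 * for a process dying in kernel mode, possibly leaving an inode
 * unused etc.
 *
 * BAD_PAGETABLE is the accompanying page-table: it is initialized
 * to point to BAD_PAGE entries.
 *
 * ZERO_PAGE is a special page that is used for zero-initialized
 * data and COW.
 */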
unsigned long __bad_pagetable(void)
{
	extern char empty_bad_page_table[PAGE_SIZE];

	__asm__ __volatile__("cld ; rep ; stosl":
		:"a" (BAD_PAGE + PAGE_TABLE),
		"D" ((long) empty_bad_page_table),
		"c" (PTRS_PER_PAGE)
		:"di","cx");
	return (unsigned long) empty_bad_page_table;
}

unsigned long __bad_page(void)
{
	extern char empty_bad_page[PAGE_SIZE];

	__asm__ __volatile__("cld ; rep ; stosl":
		:"a" (0),
		"D" ((long) empty_bad_page),
		"c" (PTRS_PER_PAGE)
		:"di","cx");
	return (unsigned long) empty_bad_page;
}

unsigned long __zero_page(void)
{
	extern char empty_zero_page[PAGE_SIZE];

	__asm__ __volatile__("cld ; rep ; stosl":
		:"a" (0),
		"D" ((long) empty_zero_page),
		"c" (PTRS_PER_PAGE)
		:"di","cx");
	return (unsigned long) empty_zero_page;
}

void show_mem(void)
{
	int i,free = 0,total = 0,reserved = 0;
	int shared = 0;

	printk("Mem-info:\n");
	show_free_areas();
	printk("Free swap: %6dkB\n",nr_swap_pages<<(PAGE_SHIFT-10));
	i = high_memory >> PAGE_SHIFT;
	while (i-- > 0) {
		total++;
		if (mem_map[i] & MAP_PAGE_RESERVED)
			reserved++;
		else if (!mem_map[i])
			free++;
		else
			shared += mem_map[i]-1;
	}
	printk("%d pages of RAM\n",total);
	printk("%d free pages\n",free);
	printk("%d reserved pages\n",reserved);
	printk("%d pages shared\n",shared);
	show_buffers();
#ifdef CONFIG_NET
	show_net_buffers();
#endif
}

extern unsigned long free_area_init(unsigned long, unsigned long);

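/*
 * paging_init() sets up the page tables - note that the first 4MB are
 * already mapped by head.S. Physical memory is mapped both at linear
 * address 0 and at the kernel address (page-directory slot 768 and up),
 * using the same page tables.
 */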
unsigned long paging_init(unsigned long start_mem, unsigned long end_mem)
{
	unsigned long * pg_dir;
	unsigned long * pg_table;
	unsigned long tmp;
	unsigned long address;

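	/*
	 * Physical page 0 is special: it contains the real-mode IVT and
	 * the BIOS data area, so it is deliberately not cleared here.
	 */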
#if 0
	memset((void *) 0, 0, PAGE_SIZE);
#endif
	start_mem = PAGE_ALIGN(start_mem);
	address = 0;
	pg_dir = swapper_pg_dir;
	while (address < end_mem) {
		tmp = *(pg_dir + 768);
		if (!tmp) {
			tmp = start_mem | PAGE_TABLE;
			*(pg_dir + 768) = tmp;
			start_mem += PAGE_SIZE;
		}
		*pg_dir = tmp;
		pg_dir++;
		pg_table = (unsigned long *) (tmp & PAGE_MASK);
		for (tmp = 0 ; tmp < PTRS_PER_PAGE ; tmp++,pg_table++) {
			if (address < end_mem)
				*pg_table = address | PAGE_SHARED;
			else
				*pg_table = 0;
			address += PAGE_SIZE;
		}
	}
	invalidate();
	return free_area_init(start_mem, end_mem);
}

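/*
 * mem_init() marks the usable pages free, counts the reserved, code and
 * data pages, and finally tests whether the processor honours the WP
 * bit in supervisor mode.
 */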
void mem_init(unsigned long start_low_mem,
	      unsigned long start_mem, unsigned long end_mem)
{
	int codepages = 0;
	int reservedpages = 0;
	int datapages = 0;
	unsigned long tmp;
	extern int etext;

	cli();
	end_mem &= PAGE_MASK;
	high_memory = end_mem;

	start_low_mem = PAGE_ALIGN(start_low_mem);
	start_mem = PAGE_ALIGN(start_mem);

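	/*
	 * Mark free the usable low-memory pages (only up to 0x9f000, as
	 * some machines reserve the last page below 640kB) and all pages
	 * above start_mem.
	 */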
	while (start_low_mem < 0x9f000) {
		mem_map[MAP_NR(start_low_mem)] = 0;
		start_low_mem += PAGE_SIZE;
	}

	while (start_mem < high_memory) {
		mem_map[MAP_NR(start_mem)] = 0;
		start_mem += PAGE_SIZE;
	}
#ifdef CONFIG_SOUND
	sound_mem_init();
#endif
	for (tmp = 0 ; tmp < high_memory ; tmp += PAGE_SIZE) {
		if (mem_map[MAP_NR(tmp)]) {
			if (tmp >= 0xA0000 && tmp < 0x100000)
				reservedpages++;
			else if (tmp < (unsigned long) &etext)
				codepages++;
			else
				datapages++;
			continue;
		}
		mem_map[MAP_NR(tmp)] = 1;
		free_page(tmp);
	}
	tmp = nr_free_pages << PAGE_SHIFT;
	printk("Memory: %luk/%luk available (%dk kernel code, %dk reserved, %dk data)\n",
		tmp >> 10,
		high_memory >> 10,
		codepages << (PAGE_SHIFT-10),
		reservedpages << (PAGE_SHIFT-10),
		datapages << (PAGE_SHIFT-10));

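	/*
	 * Test whether the WP bit is honoured in supervisor mode: map
	 * page 0 read-only, write to it, and see if the write faults
	 * (the fault handler sets wp_works_ok on success).
	 */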
	wp_works_ok = -1;
	pg0[0] = PAGE_READONLY;
	invalidate();
	__asm__ __volatile__("movb 0,%%al ; movb %%al,0": : :"ax", "memory");
	pg0[0] = 0;
	invalidate();
	if (wp_works_ok < 0)
		wp_works_ok = 0;
#ifdef CONFIG_TEST_VERIFY_AREA
	wp_works_ok = 0;
#endif
	return;
}

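/*
 * si_meminfo() fills in the memory statistics for sysinfo(2): total,
 * free, shared and buffer memory, all in bytes.
 */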
void si_meminfo(struct sysinfo *val)
{
	int i;

	i = high_memory >> PAGE_SHIFT;
	val->totalram = 0;
	val->sharedram = 0;
	val->freeram = nr_free_pages << PAGE_SHIFT;
	val->bufferram = buffermem;
	while (i-- > 0) {
		if (mem_map[i] & MAP_PAGE_RESERVED)
			continue;
		val->totalram++;
		if (!mem_map[i])
			continue;
		val->sharedram += mem_map[i]-1;
	}
	val->totalram <<= PAGE_SHIFT;
	val->sharedram <<= PAGE_SHIFT;
	return;
}

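/*
 * This handles a generic mmap of a disk file: the blocks backing the
 * requested page are located on disk via bmap() and read in with
 * bread_page().
 */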
static unsigned long file_mmap_nopage(struct vm_area_struct * area, unsigned long address,
	unsigned long page, int no_share)
{
	struct inode * inode = area->vm_inode;
	unsigned int block;
	int nr[8];
	int i, *p;

	address &= PAGE_MASK;
	block = address - area->vm_start + area->vm_offset;
	block >>= inode->i_sb->s_blocksize_bits;
	i = PAGE_SIZE >> inode->i_sb->s_blocksize_bits;
	p = nr;
	do {
		*p = bmap(inode,block);
		i--;
		block++;
		p++;
	} while (i > 0);
	return bread_page(page, inode->i_dev, nr, inode->i_sb->s_blocksize, no_share);
}

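/*
 * Generic file mmap operations: only nopage is provided, all other
 * operations take the defaults.
 */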
struct vm_operations_struct file_mmap = {
	NULL,
	NULL,
	file_mmap_nopage,
	NULL,
	NULL,
	NULL,
};