summaryrefslogtreecommitdiff
path: root/faq/context_switch.mdwn
blob: 2d090c4c9e9c8a027a1c8a0f2de3cd62db722880 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
[[!meta copyright="Copyright © 2013, 2016, 2017, 2018 Free Software Foundation,
Inc."]]

[[!meta license="""[[!toggle id="license" text="GFDL 1.2+"]][[!toggleable
id="license" text="Permission is granted to copy, distribute and/or modify this
document under the terms of the GNU Free Documentation License, Version 1.2 or
any later version published by the Free Software Foundation; with no Invariant
Sections, no Front-Cover Texts, and no Back-Cover Texts.  A copy of the license
is included in the section entitled [[GNU Free Documentation
License|/fdl]]."]]"""]]

[[!tag faq/support]]

[[!meta title="I heard that context-switch on Mach is really slow?"]]

It is not. There is no real reason why it would be particularly slow: it is just
about switching virtual address spaces and registers, which every OS has to do
anyway.

A quick-and-dirty benchmark:

        #include <fcntl.h>
        #include <semaphore.h>
        #include <stdio.h>
        #include <stdlib.h>
        #include <time.h>
        #include <unistd.h>
        #include <sys/mman.h>
        
        sem_t *sem1, *sem2;
        
        /*
         * One side of the ping-pong: wait on sem1, then post sem2, forever.
         * Each time the value returned by time(NULL) changes, print the number
         * of iterations counted since the previous change and restart the count.
         * Never returns.
         */
        void worker1(void) {
        	int rounds = 0;
        	time_t prev = time(NULL);
        
        	for (;;) {
        		time_t now = time(NULL);
        
        		if (now != prev) {
        			/* The clock value changed: report and reset. */
        			printf("%d\n", rounds);
        			rounds = 0;
        			prev = now;
        		}
        		rounds++;
        		sem_wait(sem1);
        		sem_post(sem2);
        	}
        }
        
        /*
         * The other side of the ping-pong: post sem1, then wait on sem2,
         * forever.  Never returns.
         */
        void worker2(void) {
        	for (;;) {
        		sem_post(sem1);
        		sem_wait(sem2);
        	}
        }
        
        /* Descriptor of the file backing the shared mapping; set by main(). */
        int fd;
        
        /*
         * Map the first 4096 bytes of fd as shared read/write memory and point
         * sem1 and sem2 at two consecutive sem_t slots at the start of that
         * mapping.  Exits the process if the mapping cannot be created, since
         * the semaphore pointers would otherwise be invalid.
         */
        void get_sems(void) {
        	void *ptr = mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_SHARED, fd, 0);
        
        	/* mmap reports failure with MAP_FAILED, not NULL. */
        	if (ptr == MAP_FAILED) {
        		perror("mmap");
        		exit(EXIT_FAILURE);
        	}
        	sem1 = ptr;
        	sem2 = sem1+1;
        }
        
        /*
         * Create a 4096-byte file, place two process-shared semaphores
         * (initial value 0) in a shared mapping of it, then fork.  The parent
         * runs worker1(), which prints the iteration counts; the child runs
         * worker2().  Any setup failure is reported and ends the program
         * instead of being ignored.
         */
        int main(void) {
        	fd = open("/tmp/foo", O_CREAT|O_TRUNC|O_RDWR, 0666);
        	if (fd < 0) {
        		perror("open");
        		return EXIT_FAILURE;
        	}
        	/* Give the file the size that get_sems() maps. */
        	if (ftruncate(fd, 4096) < 0) {
        		perror("ftruncate");
        		return EXIT_FAILURE;
        	}
        
        	get_sems();
        	/* pshared = 1: the semaphores are shared between processes. */
        	if (sem_init(sem1, 1, 0) < 0 || sem_init(sem2, 1, 0) < 0) {
        		perror("sem_init");
        		return EXIT_FAILURE;
        	}
        
        	pid_t pid = fork();
        	if (pid < 0) {
        		/* No child means nobody would ever post sem1. */
        		perror("fork");
        		return EXIT_FAILURE;
        	}
        	if (pid > 0)
        		worker1();
        	else {
        		/* Map the same file again in the child. */
        		get_sems();
        		worker2();
        	}
        	return 0;
        }

Run on my current Linux system (a Core i5-10210U), this gets about 300k switches per second. Running it on Hurd-in-kvm (which would supposedly be slower) gets about 400k switches per second.