1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
|
#include "kernel.h"
// http://www.intel.com/content/dam/doc/specification-update/64-architecture-x2apic-specification.pdf
// http://download.intel.com/design/chipsets/datashts/29056601.pdf
// http://www.scs.stanford.edu/05au-cs240c/lab/ia32/IA32-3.pdf
// https://wiki.osdev.org/Symmetric_Multiprocessing
// https://wiki.osdev.org/APIC_timer
#include <stdint.h>
#include "smp.h"
#include "gdt.h"
#include "mem.h"
#include "interrupts.h"
#include "kmalloc.h"
#include "spinlock.h"
#include "asm_x86.h"
#include "asm_pit.h"
#include "asm_mp.h"
// Local APIC register offsets. readAPIC()/writeAPIC() add these byte offsets
// to local_apic_addr to form the address of the register.
#define APIC_APICID 0x20
#define APIC_APICVER 0x30
#define APIC_TASKPRIOR 0x80
#define APIC_EOI 0x0B0
#define APIC_LDR 0x0D0
#define APIC_DFR 0x0E0
#define APIC_SPURIOUS 0x0F0
#define APIC_ESR 0x280
// interrupt command register, low and high 32-bit halves (used to send IPIs)
#define APIC_ICRL 0x300
#define APIC_ICRH 0x310
// local vector table entries
#define APIC_LVT_TMR 0x320
#define APIC_LVT_PERF 0x340
#define APIC_LVT_LINT0 0x350
#define APIC_LVT_LINT1 0x360
#define APIC_LVT_ERR 0x370
// APIC timer: initial count, current count and divide configuration
#define APIC_TMRINITCNT 0x380
#define APIC_TMRCURRCNT 0x390
#define APIC_TMRDIV 0x3E0
// NOTE(review): APIC_LAST is not referenced in the visible part of this file.
#define APIC_LAST 0x38F
// Bit values for APIC registers.
// NOTE(review): presumably APIC_DISABLE is the LVT mask bit and APIC_NMI the
// LVT delivery-mode field; neither is used in the visible code - confirm.
#define APIC_DISABLE 0x10000
// same bit value that apicEnable() ORs into the APIC_SPURIOUS register
#define APIC_SW_ENABLE 0x100
#define APIC_CPUFOCUS 0x200
#define APIC_NMI (4<<8)
// ORed into the APIC_LVT_TMR entry by kernel_ap() and smp_start_aps()
#define TMR_PERIODIC 0x20000
#define TMR_BASEDIV (1<<20)
// TODO: multiprocessor bookkeeping state below should be moved out of this file.
// c1..c3: not used by any live code in the visible part of this file.
uint32_t c1,c2,c3;
// incremented by kernel_ap_old() to pick that caller's slot in cpu_counter
volatile uint8_t proc;
// one free-running counter per slot, advanced by kernel_ap_old()
uint32_t cpu_counter[SMP_MAX_PROC];
// base addresses of the local APIC and IO APIC register windows;
// both are filled in by smp_start_aps() from the smp_processors description
uint32_t local_apic_addr;
uint32_t io_apic_addr;
// APIC timer initial count computed once in smp_start_aps() and reused by
// kernel_ap() when it programs its own timer
uint32_t countdown;
/**
 * Write one 32-bit IO APIC register through the index/data window.
 *
 * The register index is stored into the word at io_apic_addr + 0x00 and the
 * value is then stored into the word at io_apic_addr + 0x10.
 *
 * @param offset register index; only the low 8 bits are used.
 * @param value  value to store into the selected register.
 */
void writeIOAPIC(uint32_t offset, uint32_t value)
{
    /* volatile: both stores are device accesses and must be emitted in
       exactly this order; the integer base address is cast explicitly */
    volatile uint32_t *window = (volatile uint32_t *)(uintptr_t)io_apic_addr;

    window[0] = (offset & 0xff);
    window[4] = value;
}
/**
 * Read one 32-bit IO APIC register through the index/data window.
 *
 * The register index is stored into the word at io_apic_addr + 0x00 and the
 * register content is then loaded from the word at io_apic_addr + 0x10.
 *
 * @param offset register index; only the low 8 bits are used.
 * @return current content of the selected register.
 */
uint32_t readIOAPIC(uint32_t offset)
{
    /* volatile: the index store and the data load are device accesses that
       must both happen, in this order, on every call */
    volatile uint32_t *window = (volatile uint32_t *)(uintptr_t)io_apic_addr;

    window[0] = (offset & 0xff);
    return window[4];
}
/**
 * Program the pair of IO APIC registers belonging to one interrupt input.
 *
 * Register 0x10 + 2*irq receives `low` and the register directly after it
 * receives `high` (the redirection table layout of the 82093AA IO APIC).
 *
 * @param irq  IO APIC input number.
 * @param low  value for the lower 32-bit register of the pair.
 * @param high value for the upper 32-bit register of the pair.
 */
void irqIOAPIC(uint32_t irq, uint32_t low, uint32_t high)
{
    const uint32_t first_reg = 0x10 + irq * 2;

    writeIOAPIC(first_reg, low);
    writeIOAPIC(first_reg + 1, high);
}
/**
 * Store a 32-bit value into a local APIC register.
 *
 * @param offset byte offset of the register from local_apic_addr
 *               (one of the APIC_* register offsets).
 * @param value  value to store.
 */
void writeAPIC(uint32_t offset, uint32_t value)
{
    /* volatile: this is a memory-mapped register, so the store must never be
       merged, reordered or dropped; the address is cast explicitly because
       it is kept as an integer */
    volatile uint32_t *reg = (volatile uint32_t *)(uintptr_t)(local_apic_addr + offset);

    *reg = value;
}
/**
 * Load a 32-bit value from a local APIC register.
 *
 * @param offset byte offset of the register from local_apic_addr
 *               (one of the APIC_* register offsets).
 * @return current content of the register.
 */
uint32_t readAPIC(uint32_t offset)
{
    /* volatile: the register can change behind the compiler's back (e.g. the
       timer's current count), so every call must perform a real load */
    const volatile uint32_t *reg = (const volatile uint32_t *)(uintptr_t)(local_apic_addr + offset);

    return *reg;
}
/**
 * Fetch the local APIC ID register of the calling processor.
 *
 * @return the raw, unshifted content of the APIC_APICID register.
 */
uint32_t apicID()
{
    const uint32_t raw_id = readAPIC(APIC_APICID);

    return raw_id;
}
/**
 * Signal end-of-interrupt by writing 0 to the local APIC register at
 * offset 0xB0 (the same offset this file names APIC_EOI).
 */
void apicEOI()
{
    const uint32_t eoi_offset = 0xB0;

    writeAPIC(eoi_offset, 0);
}
/**
 * Send an inter-processor interrupt through the local APIC's interrupt
 * command register.
 *
 * @param dest   APIC ID of the target processor; placed in bits 24-31 of the
 *               high ICR word.
 * @param number interrupt vector; placed in the low 8 bits of the low ICR
 *               word together with bit 14.
 */
void apicIPI(uint8_t dest, uint8_t number)
{
    /* Widen before shifting: a uint8_t promotes to signed int, and shifting
       a value >= 0x80 left by 24 would overflow it (undefined behavior). */
    writeAPIC(APIC_ICRH, (uint32_t)dest << 24); // destination apic, bits 24-31
    writeAPIC(APIC_ICRL, (uint32_t)number | (1u << 14)); // writing the low word sends the ipi
}
/**
 * Turn on the calling processor's local APIC by setting bit 0x100 in its
 * spurious-interrupt register; all other bits of the register are preserved.
 */
void apicEnable()
{
    uint32_t spurious = readAPIC(APIC_SPURIOUS);

    spurious |= 0x100;
    writeAPIC(APIC_SPURIOUS, spurious);
}
/**
 * Measure how fast the local APIC timer counts and derive the bus frequency.
 *
 * The timer is loaded with 0xFFFFFFFF, left to count down for one
 * asm_pit_sleep_50ms() interval, and the elapsed ticks are scaled by 20 to a
 * full second. All arithmetic is 32-bit and wraps on overflow. The timer is
 * left running; smp_start_aps() reprograms it right after this call.
 *
 * select mode : divisor.
 * 0 - 1
 * 1 - 2
 * 2 - 4
 * 3 - 8
 * 4 - 16
 * 5 - 32
 * 6 - 64
 * 7 - 128
 *
 * @param sel index into the table above; values above 7 are clamped to 7
 *            instead of reading past the end of the lookup tables.
 * @return measured ticks per second multiplied by the divisor (bus speed in Hz).
 */
uint32_t probeBusSpeed(uint32_t sel)
{
    static const uint32_t div[] = {1, 2, 4, 8, 16, 32, 64, 128};
    /* divide-configuration register encoding for each divisor above */
    static const uint32_t reg[] = {0xB, 0x0, 0x1, 0x2, 0x3, 0x8, 0x9, 0xA};
    const uint32_t entries = sizeof div / sizeof div[0];

    if (sel >= entries)
    {
        sel = entries - 1;
    }

    uint32_t divisor = div[sel];
    klog("Probing bus speed for 50ms (div=%d)) ...",divisor);

    writeAPIC(APIC_TMRDIV, reg[sel]);
    writeAPIC(APIC_TMRINITCNT, 0xFFFFFFFF);

    asm_pit_sleep_50ms();

    uint32_t ticksInS = 0xFFFFFFFF - readAPIC(APIC_TMRCURRCNT);
    ticksInS *= 20; // adjust to one full second.

    klog("%d MHz (%d Hz) bus speed (ticks=%d)",ticksInS/(1000000/divisor),ticksInS*divisor,ticksInS/20);
    return ticksInS * divisor;
}
/**
 * Switches the calling processor onto a freshly allocated stack and then
 * jumps to kernel_ap(). Control does not come back to the caller.
 *
 * NOTE(review): presumably entered by each application processor from the
 * startup trampoline - confirm against asm_mp.
 */
void smp_main()
{
// setup stack
// NOTE(review): the value returned by kballoc(1) is used directly as the
// stack pointer. If kballoc returns the lowest address of the allocation,
// the stack (which grows downwards) starts outside the block; the disabled
// code in kernel_ap() used "block + 4095" instead - confirm.
uint32_t ebp=kballoc(1);
// load the new address into EBP, mirror it into ESP, then leave via a jump
// (not a call), so nothing is pushed for a return
asm volatile("mov %0, %%ebp"::"r"(ebp));
asm volatile("mov %ebp, %esp");
asm volatile("jmp kernel_ap");
}
/**
 * Per-processor kernel entry, reached through the jump at the end of
 * smp_main(). Logs the local APIC ID, enables the local APIC, installs
 * interrupts and the GDT, starts the periodic APIC timer and then idles
 * forever. Never returns.
 */
void kernel_ap()
{
klog("smp local apic id: 0x%08X",apicID());
apicEnable();
interrupts_install();
gdt_init();
// Same timer programming smp_start_aps() applies on the boot processor:
// divide configuration 0x3, periodic mode on vector INTERRUPT_APIC_TIMER,
// initial count taken from the shared `countdown`.
writeAPIC(APIC_TMRDIV, 0x3);
writeAPIC(APIC_LVT_TMR,INTERRUPT_APIC_TIMER | TMR_PERIODIC);
writeAPIC(APIC_TMRINITCNT, countdown);
x86_sti();
// NOTE(review): presumably releases a lock taken by the AP startup code so
// that the next processor may proceed - confirm in asm_mp.
asm_smp_unlock();
// idle loop: halt until something wakes the CPU, then log the APIC ID
// register and the timer's current count
while(1)
{
asm("hlt");
klog("tack: 0x%08X: 0x%08X",readAPIC(APIC_APICID), readAPIC(APIC_TMRCURRCNT));
}
// everything below is unreachable / disabled leftover code
// switch_to_user_mode();
/*
while(1);
uint32_t ebp=pmmngr_alloc_block()+4095;
asm volatile("mov %0, %%ebp"::"r"(ebp));
asm volatile("mov %ebp, %esp");
asm volatile("jmp kernel_ap");
proc=c1=c2=c3=0;
for(int i=0;i<SMP_MAX_PROC;i++)cpu_counter[i]=0;
*/
}
/**
 * Earlier per-processor test loop: claims the next slot number by bumping
 * the shared `proc` counter, then increments that slot of cpu_counter
 * forever, logging every 1000000th value. Never returns.
 *
 * Neither the `proc` update nor the slot index is protected or range-checked.
 */
void kernel_ap_old()
{
    proc += 1;
    const uint8_t slot = proc;

    for (;;)
    {
        const uint32_t ticks = ++cpu_counter[slot];

        //lock_spin(0);
        if (ticks % 1000000 != 0)
        {
            continue;
        }
        klog("cpu[%d] %d",slot,ticks);
        //lock_release(0);
    }
}
// this will start all our application processors!
/**
 * Bring up the boot processor's APIC timer, route three IO APIC inputs and
 * send an INIT followed by a startup IPI to every processor other than the
 * boot processor.
 *
 * Side effects: sets the globals local_apic_addr, io_apic_addr and countdown.
 *
 * @param pros processor description; the fields read here are
 *             local_apic_address, io_apic_address, processors, boot and
 *             local_apic_id[].
 */
void smp_start_aps(smp_processors *pros)
{
    // TODO: check if local APIC is present via CPUID (P6 (i686) and above)
    local_apic_addr = pros->local_apic_address;
    io_apic_addr = pros->io_apic_address;

    klog("bsp local apic id: 0x%08X",apicID());
    apicEnable(); // bsp apic seems to be enabled anyway.

    uint32_t speed = probeBusSpeed(4); // get bus speed (divisor: 16)

    // setup apic timer
    countdown = speed / 16; // tick once a second
    writeAPIC(APIC_TMRDIV, 0x3); // divisor 16
    writeAPIC(APIC_LVT_TMR, INTERRUPT_APIC_TIMER | TMR_PERIODIC); // periodic, on vector INTERRUPT_APIC_TIMER
    writeAPIC(APIC_TMRINITCNT, countdown);

    // setup IO APIC
    // PIT irq 00 -> 02 flags 0 -> 0x90
    // kb irq 01 -> 01 flags ? -> 0x91
    // mouse irq 12 -> 12 flags ? -> 0x92
    irqIOAPIC(2, 0x90, 0x0);
    irqIOAPIC(1, 0x91, 0x0);
    irqIOAPIC(12, 0x92, 0x0);

    /* The interrupt command register is memory-mapped hardware. The INIT and
       SIPI commands are two consecutive stores to the same address, so the
       pointer must be volatile or the compiler may discard the first one. */
    volatile uint32_t *icr_high = (volatile uint32_t *)(uintptr_t)(local_apic_addr + APIC_ICRH);
    volatile uint32_t *icr_low = (volatile uint32_t *)(uintptr_t)(local_apic_addr + APIC_ICRL);

    for (int i = 0; i < pros->processors; i++)
    {
        if (pros->boot == i)
        {
            continue;
        }

        uint8_t dest = pros->local_apic_id[i];
        klog("starting cpu %d (dest: %d) ",i,dest);

        /* widen before shifting: dest promotes to signed int and ids >= 0x80
           would overflow it when shifted left by 24 */
        *icr_high = (uint32_t)dest << 24; // destination apic.

        *icr_low = (5u << 8) | (1u << 14); // 101 INIT IPI

        // TODO: wait 10 milliseconds
        // https://wiki.osdev.org/Symmetric_Multiprocessing

        *icr_low = (6u << 8) | (1u << 14) | 0x7; // 110 SIPI, vector 0x7

        // TODO: poll a flag?(timeout 1ms)
        // TODO retry 110 SIPI with 1s timeout
    }
}
|