Subversion Repositories HelenOS-historic

Rev

Rev 993 | Rev 1053 | Go to most recent revision | Details | Compare with Previous | Last modification | View Log | RSS feed

Rev Author Line No. Line
52 vana 1
/*
92 jermar 2
 * Copyright (C) 2005 Jakub Vana
3
 * All rights reserved.
4
 *
5
 * Redistribution and use in source and binary forms, with or without
6
 * modification, are permitted provided that the following conditions
7
 * are met:
8
 *
9
 * - Redistributions of source code must retain the above copyright
10
 *   notice, this list of conditions and the following disclaimer.
11
 * - Redistributions in binary form must reproduce the above copyright
12
 *   notice, this list of conditions and the following disclaimer in the
13
 *   documentation and/or other materials provided with the distribution.
14
 * - The name of the author may not be used to endorse or promote products
15
 *   derived from this software without specific prior written permission.
16
 *
17
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
18
 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
19
 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
20
 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
21
 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
22
 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
23
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
24
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
25
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
26
 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
27
 *
28
 */
52 vana 29
 
30
#include <fpu_context.h>
1023 vana 31
#include <arch/register.h>
993 jermar 32
#include <print.h>
52 vana 33
 
979 vana 34
/*
 * Template fragments used only by fpu_context_save():
 *  FR_SPILL(op, reg)  - one stf.spill of f<reg> through address operand %<op>,
 *                       using the 0x80 post-increment form.
 *  FR_SPILL8(...)     - eight spills through operands %0..%7 followed by a
 *                       stop (";;"), so each address register is updated at
 *                       most once per instruction group.
 */
#define FR_SPILL(op, reg) \
	"stf.spill [%" #op "]=f" #reg ",0x80\n"
#define FR_SPILL8(n0, n1, n2, n3, n4, n5, n6, n7) \
	FR_SPILL(0, n0) FR_SPILL(1, n1) FR_SPILL(2, n2) FR_SPILL(3, n3) \
	FR_SPILL(4, n4) FR_SPILL(5, n5) FR_SPILL(6, n6) FR_SPILL(7, n7) ";;"

/** Save floating-point registers f2..f127 into a context structure.
 *
 * Eight address cursors are started at fctx->fr[0] .. fctx->fr[7]. Every
 * spill goes through one cursor and advances it by 0x80 bytes. f0 and f1 are
 * not stored. The first group only uses cursors 2..7 (for f2..f7), so f8 and
 * f9 are the first registers written through cursors 0 and 1, i.e. they land
 * at fr[0] and fr[1]. fpu_context_restore() walks the area in exactly the
 * same order, so the two functions must be kept in sync.
 *
 * The cursors are passed to the asm as read-write ("+r") operands because the
 * post-increment addressing modifies them; GCC requires that input-only
 * operands are left unchanged. The "memory" clobber tells the compiler that
 * the asm stores to memory not named in the operand list.
 *
 * @param fctx Context structure whose fr area receives the register image.
 */
void fpu_context_save(fpu_context_t *fctx)
{
	void *cur0 = &fctx->fr[0];
	void *cur1 = &fctx->fr[1];
	void *cur2 = &fctx->fr[2];
	void *cur3 = &fctx->fr[3];
	void *cur4 = &fctx->fr[4];
	void *cur5 = &fctx->fr[5];
	void *cur6 = &fctx->fr[6];
	void *cur7 = &fctx->fr[7];

	asm volatile (
		/* f2..f7: cursors 0 and 1 are deliberately left untouched here. */
		FR_SPILL(2, 2) FR_SPILL(3, 3) FR_SPILL(4, 4)
		FR_SPILL(5, 5) FR_SPILL(6, 6) FR_SPILL(7, 7) ";;"

		FR_SPILL8(8, 9, 10, 11, 12, 13, 14, 15)
		FR_SPILL8(16, 17, 18, 19, 20, 21, 22, 23)
		FR_SPILL8(24, 25, 26, 27, 28, 29, 30, 31)

		FR_SPILL8(32, 33, 34, 35, 36, 37, 38, 39)
		FR_SPILL8(40, 41, 42, 43, 44, 45, 46, 47)
		FR_SPILL8(48, 49, 50, 51, 52, 53, 54, 55)
		FR_SPILL8(56, 57, 58, 59, 60, 61, 62, 63)
		FR_SPILL8(64, 65, 66, 67, 68, 69, 70, 71)
		FR_SPILL8(72, 73, 74, 75, 76, 77, 78, 79)
		FR_SPILL8(80, 81, 82, 83, 84, 85, 86, 87)
		FR_SPILL8(88, 89, 90, 91, 92, 93, 94, 95)

		FR_SPILL8(96, 97, 98, 99, 100, 101, 102, 103)
		FR_SPILL8(104, 105, 106, 107, 108, 109, 110, 111)
		FR_SPILL8(112, 113, 114, 115, 116, 117, 118, 119)
		FR_SPILL8(120, 121, 122, 123, 124, 125, 126, 127)
		: "+r" (cur0), "+r" (cur1), "+r" (cur2), "+r" (cur3),
		  "+r" (cur4), "+r" (cur5), "+r" (cur6), "+r" (cur7)
		:
		: "memory"
	);
}

#undef FR_SPILL8
#undef FR_SPILL
187
 
188
 
57 vana 189
/*
 * Template fragments used only by fpu_context_restore():
 *  FR_FILL(op, reg)  - one ldf.fill of f<reg> through address operand %<op>,
 *                      using the 0x80 post-increment form.
 *  FR_FILL8(...)     - eight fills through operands %0..%7 followed by a
 *                      stop (";;"), so each address register is updated at
 *                      most once per instruction group.
 */
#define FR_FILL(op, reg) \
	"ldf.fill f" #reg "=[%" #op "],0x80\n"
#define FR_FILL8(n0, n1, n2, n3, n4, n5, n6, n7) \
	FR_FILL(0, n0) FR_FILL(1, n1) FR_FILL(2, n2) FR_FILL(3, n3) \
	FR_FILL(4, n4) FR_FILL(5, n5) FR_FILL(6, n6) FR_FILL(7, n7) ";;"

/** Reload floating-point registers f2..f127 from a context structure.
 *
 * Mirror image of fpu_context_save(): eight address cursors start at
 * fctx->fr[0] .. fctx->fr[7] and every fill advances its cursor by 0x80
 * bytes. f0 and f1 are not loaded. The first group only uses cursors 2..7
 * (for f2..f7), so f8 and f9 are read from fr[0] and fr[1]. The order must
 * stay identical to the one used by fpu_context_save().
 *
 * The cursors are passed to the asm as read-write ("+r") operands because the
 * post-increment addressing modifies them; GCC requires that input-only
 * operands are left unchanged. The "memory" clobber tells the compiler that
 * the asm reads memory not named in the operand list, so pending stores to
 * the context are not reordered past it.
 *
 * The overwritten floating-point registers are intentionally not listed as
 * clobbers: replacing their contents is the purpose of this function.
 *
 * @param fctx Context structure whose fr area holds the register image.
 */
void fpu_context_restore(fpu_context_t *fctx)
{
	void *cur0 = &fctx->fr[0];
	void *cur1 = &fctx->fr[1];
	void *cur2 = &fctx->fr[2];
	void *cur3 = &fctx->fr[3];
	void *cur4 = &fctx->fr[4];
	void *cur5 = &fctx->fr[5];
	void *cur6 = &fctx->fr[6];
	void *cur7 = &fctx->fr[7];

	asm volatile (
		/* f2..f7: cursors 0 and 1 are deliberately left untouched here. */
		FR_FILL(2, 2) FR_FILL(3, 3) FR_FILL(4, 4)
		FR_FILL(5, 5) FR_FILL(6, 6) FR_FILL(7, 7) ";;"

		FR_FILL8(8, 9, 10, 11, 12, 13, 14, 15)
		FR_FILL8(16, 17, 18, 19, 20, 21, 22, 23)
		FR_FILL8(24, 25, 26, 27, 28, 29, 30, 31)

		FR_FILL8(32, 33, 34, 35, 36, 37, 38, 39)
		FR_FILL8(40, 41, 42, 43, 44, 45, 46, 47)
		FR_FILL8(48, 49, 50, 51, 52, 53, 54, 55)
		FR_FILL8(56, 57, 58, 59, 60, 61, 62, 63)
		FR_FILL8(64, 65, 66, 67, 68, 69, 70, 71)
		FR_FILL8(72, 73, 74, 75, 76, 77, 78, 79)
		FR_FILL8(80, 81, 82, 83, 84, 85, 86, 87)
		FR_FILL8(88, 89, 90, 91, 92, 93, 94, 95)

		FR_FILL8(96, 97, 98, 99, 100, 101, 102, 103)
		FR_FILL8(104, 105, 106, 107, 108, 109, 110, 111)
		FR_FILL8(112, 113, 114, 115, 116, 117, 118, 119)
		FR_FILL8(120, 121, 122, 123, 124, 125, 126, 127)
		: "+r" (cur0), "+r" (cur1), "+r" (cur2), "+r" (cur3),
		  "+r" (cur4), "+r" (cur5), "+r" (cur6), "+r" (cur7)
		:
		: "memory"
	);
}

#undef FR_FILL8
#undef FR_FILL
344
 
1023 vana 345
void fpu_disable(void)
346
{
347
		asm volatile(
348
			"ssm %0;;\n"
349
			"srlz.i\n"
350
			"srlz.d;;\n"
351
			:
352
			:"i" (PSR_DFL_MASK|PSR_DFH_MASK)
353
		);
979 vana 354
 
1023 vana 355
}
979 vana 356
 
1023 vana 357
void fpu_enable(void)
358
{
359
		asm volatile(
360
			"rsm %0;;\n"
361
			"srlz.i\n"
362
			"srlz.d;;\n"
363
			:
364
			:"i" (PSR_DFL_MASK|PSR_DFH_MASK)
365
		);
366
 
367
}
368
 
369
void fpu_init(void)
370
{
371
		__u64 a = 0;
372
		fpu_enable();
373
		asm volatile
374
		(
375
			"mov %0=ar.fpsr;;\n"
376
			"or %0=%0,%1;;\n"
377
			"mov ar.fpsr=%0;;\n"
378
			: "+r" (a)
379
			: "r" (0x38)
380
		);
381
 
382
		asm volatile(
383
			"mov f2=f0\n"
384
			"mov f3=f0\n"
385
			"mov f4=f0\n"
386
			"mov f5=f0\n"
387
			"mov f6=f0\n"
388
			"mov f7=f0\n"
389
			"mov f8=f0\n"
390
			"mov f9=f0\n"
391
 
392
			"mov f10=f0\n"
393
			"mov f11=f0\n"
394
			"mov f12=f0\n"
395
			"mov f13=f0\n"
396
			"mov f14=f0\n"
397
			"mov f15=f0\n"
398
			"mov f16=f0\n"
399
			"mov f17=f0\n"
400
			"mov f18=f0\n"
401
			"mov f19=f0\n"
402
 
403
			"mov f20=f0\n"
404
			"mov f21=f0\n"
405
			"mov f22=f0\n"
406
			"mov f23=f0\n"
407
			"mov f24=f0\n"
408
			"mov f25=f0\n"
409
			"mov f26=f0\n"
410
			"mov f27=f0\n"
411
			"mov f28=f0\n"
412
			"mov f29=f0\n"
413
 
414
			"mov f30=f0\n"
415
			"mov f31=f0\n"
416
			"mov f32=f0\n"
417
			"mov f33=f0\n"
418
			"mov f34=f0\n"
419
			"mov f35=f0\n"
420
			"mov f36=f0\n"
421
			"mov f37=f0\n"
422
			"mov f38=f0\n"
423
			"mov f39=f0\n"
424
 
425
			"mov f40=f0\n"
426
			"mov f41=f0\n"
427
			"mov f42=f0\n"
428
			"mov f43=f0\n"
429
			"mov f44=f0\n"
430
			"mov f45=f0\n"
431
			"mov f46=f0\n"
432
			"mov f47=f0\n"
433
			"mov f48=f0\n"
434
			"mov f49=f0\n"
435
 
436
			"mov f50=f0\n"
437
			"mov f51=f0\n"
438
			"mov f52=f0\n"
439
			"mov f53=f0\n"
440
			"mov f54=f0\n"
441
			"mov f55=f0\n"
442
			"mov f56=f0\n"
443
			"mov f57=f0\n"
444
			"mov f58=f0\n"
445
			"mov f59=f0\n"
446
 
447
			"mov f60=f0\n"
448
			"mov f61=f0\n"
449
			"mov f62=f0\n"
450
			"mov f63=f0\n"
451
			"mov f64=f0\n"
452
			"mov f65=f0\n"
453
			"mov f66=f0\n"
454
			"mov f67=f0\n"
455
			"mov f68=f0\n"
456
			"mov f69=f0\n"
457
 
458
			"mov f70=f0\n"
459
			"mov f71=f0\n"
460
			"mov f72=f0\n"
461
			"mov f73=f0\n"
462
			"mov f74=f0\n"
463
			"mov f75=f0\n"
464
			"mov f76=f0\n"
465
			"mov f77=f0\n"
466
			"mov f78=f0\n"
467
			"mov f79=f0\n"
468
 
469
			"mov f80=f0\n"
470
			"mov f81=f0\n"
471
			"mov f82=f0\n"
472
			"mov f83=f0\n"
473
			"mov f84=f0\n"
474
			"mov f85=f0\n"
475
			"mov f86=f0\n"
476
			"mov f87=f0\n"
477
			"mov f88=f0\n"
478
			"mov f89=f0\n"
479
 
480
			"mov f90=f0\n"
481
			"mov f91=f0\n"
482
			"mov f92=f0\n"
483
			"mov f93=f0\n"
484
			"mov f94=f0\n"
485
			"mov f95=f0\n"
486
			"mov f96=f0\n"
487
			"mov f97=f0\n"
488
			"mov f98=f0\n"
489
			"mov f99=f0\n"
490
 
491
			"mov f100=f0\n"
492
			"mov f101=f0\n"
493
			"mov f102=f0\n"
494
			"mov f103=f0\n"
495
			"mov f104=f0\n"
496
			"mov f105=f0\n"
497
			"mov f106=f0\n"
498
			"mov f107=f0\n"
499
			"mov f108=f0\n"
500
			"mov f109=f0\n"
501
 
502
			"mov f110=f0\n"
503
			"mov f111=f0\n"
504
			"mov f112=f0\n"
505
			"mov f113=f0\n"
506
			"mov f114=f0\n"
507
			"mov f115=f0\n"
508
			"mov f116=f0\n"
509
			"mov f117=f0\n"
510
			"mov f118=f0\n"
511
			"mov f119=f0\n"
512
 
513
			"mov f120=f0\n"
514
			"mov f121=f0\n"
515
			"mov f122=f0\n"
516
			"mov f123=f0\n"
517
			"mov f124=f0\n"
518
			"mov f125=f0\n"
519
			"mov f126=f0\n"
520
			"mov f127=f0\n"
521
 
522
		);
523
 
524
		fpu_enable();
525
}
526