forked from ssvb/cpuburn-arm
-
Notifications
You must be signed in to change notification settings - Fork 0
/
cpuburn-a9.S
97 lines (91 loc) · 3.03 KB
/
cpuburn-a9.S
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
/*
* Copyright © 2012 Siarhei Siamashka <[email protected]>
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice (including the next
* paragraph) shall be included in all copies or substantial portions of the
* Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
/*
* This program tries to stress ARM Cortex-A9 processor to generate as
* much heat as possible. Needs NEON, so does not work on Tegra 2.
* WARNING: improperly cooled or otherwise flawed hardware may potentially
* overheat and fail. Use at your own risk.
*
* Compilation instructions:
* $ arm-linux-gnueabihf-gcc -o cpuburn-a9 cpuburn-a9.S
*
* See http://ssvb.github.com/2012/04/10/cpuburn-arm-cortex-a9.html
* for more details.
*/
.syntax unified
.text
.arch armv7-a
.fpu neon
.arm
.global main
.global sysconf
.global fork
/* optimal value for LOOP_UNROLL_FACTOR seems to be BTB size dependent */
#define LOOP_UNROLL_FACTOR 110
/* 64 seems to be a good choice */
#define STEP 64
.func main
.type main, %function
main:
#ifdef __linux__
mov r0, 84 /* _SC_NPROCESSORS_ONLN */
blx sysconf
mov r4, r0
cmp r4, #2
blt 1f
blx fork /* have at least 2 cores */
cmp r4, #4
blt 1f
blx fork /* have at least 4 cores */
1:
#endif
ldr lr, =(STEP * 4 + 15)
subs lr, sp, lr
bic lr, lr, #15
mov ip, #STEP
mov r0, #0
mov r1, #0
mov r2, #0
mov r3, #0
ldr r4, =0xFFFFFFFF
b 0f
.ltorg
0:
.rept LOOP_UNROLL_FACTOR
vld2.8 {q0}, [lr, :128], ip
it ne
smlalne r0, r1, lr, r4
bne 1f
1:
vld2.8 {q1}, [lr, :128], ip
it ne
smlalne r2, r3, lr, r4
bne 1f
1:
vld2.8 {q2}, [lr, :128], ip
vld2.8 {q3}, [lr, :128], ip
it ne
subsne lr, lr, #(STEP * 4)
.endr
bne 0b
.endfunc