~melchizedek6809/WolkenWelten

ref: e910bd82e598d6f560b8899dd1d88fb3ed554cd3 WolkenWelten/common/src/asm/armv7l.s -rw-r--r-- 2.1 KiB
e910bd82Ben (X13/Arch) Updated contact info 11 months ago
                                                                                
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
@ ARM (32-bit) NEON routines written in GNU assembler syntax.
@ The three symbols below are exported; each one updates arrays that are
@ referenced as external symbols (none are defined in this part of the file).
.text
.global sparticlePosUpdateNEON
.global  particlePosUpdateNEON
.global      rainPosUpdateNEON

@-----------------------------------------------------------------------
@ rainPosUpdateNEON
@
@ Takes no register arguments; works on the external symbols rainCount,
@ rainVel, glRainDrops and rainDrops.
@ For every 16-byte vector i (four 32-bit floats) that is processed:
@     glRainDrops[i] += rainDrops[i]
@     rainDrops[i]   += rainVel
@ Two vectors are handled per pass and the loop runs
@ (rainCount >> 1) + 1 times, so it always runs at least once and
@ processes one or two vectors more than the value of rainCount.
@ NOTE(review): presumably both arrays are padded for this - confirm.
@
@ Regs:  r1 = passes left, r2 -> glRainDrops, r3 -> rainDrops,
@        r12 = 16 (post-increment stride in bytes), q8 = rainVel
@ Clobb: r1-r3, r12, q0-q3, q8, flags
@
@ Only q0-q3 and q8 are used as vector registers: q4-q7 (d8-d15) are
@ callee-saved under the AAPCS and must not be changed without being
@ saved and restored.
@-----------------------------------------------------------------------
rainPosUpdateNEON:
  ldr r3,=rainCount
  ldr r1,[r3]
  lsr r1,r1,#1
  add r1,r1,#1              @ r1 = rainCount/2 + 1 passes

  ldr r3,=rainVel
  vld1.32 {q8},[r3]         @ q8 = rainVel, constant for the whole loop

  mov r12,#16               @ one q register = 16 bytes
  ldr r2,=glRainDrops
  ldr r3,=rainDrops
.LrainPosUpdateLoopNEON:
  @ first vector of this pass
  vld1.32 {q0},[r2]
  vld1.32 {q1},[r3]
  vadd.f32 q0,q0,q1         @ gl += drop
  vst1.32 {q0},[r2],r12
  vadd.f32 q1,q1,q8         @ drop += rainVel
  vst1.32 {q1},[r3],r12

  @ second vector of this pass
  vld1.32 {q2},[r2]
  vld1.32 {q3},[r3]
  vadd.f32 q2,q2,q3
  vst1.32 {q2},[r2],r12
  vadd.f32 q3,q3,q8
  vst1.32 {q3},[r3],r12

  subs r1,r1,#1
  bne .LrainPosUpdateLoopNEON
  bx lr                     @ interworking-safe return


@-----------------------------------------------------------------------
@ particlePosUpdateNEON
@
@ Takes no register arguments; works on the external symbols
@ particleCount, glParticles and particles.
@ For every 16-byte vector i (four 32-bit floats) that is processed:
@     glParticles[i] += particles[i]
@ The particles array is only read, never written.
@ Four vectors are handled per pass and the loop runs
@ (particleCount >> 2) + 1 times, so it always runs at least once and
@ processes one to four vectors more than the value of particleCount.
@ NOTE(review): presumably both arrays are padded for this - confirm.
@
@ Regs:  r1 = passes left, r2 -> glParticles, r3 -> particles,
@        r12 = 16 (post-increment stride in bytes)
@ Clobb: r1-r3, r12, q0-q3, q8-q11, flags
@
@ Only q0-q3 and q8-q11 are used as vector registers: q4-q7 (d8-d15)
@ are callee-saved under the AAPCS and must not be changed without
@ being saved and restored.
@-----------------------------------------------------------------------
particlePosUpdateNEON:
  ldr r3,=particleCount
  ldr r1,[r3]
  lsr r1,r1,#2
  add r1,r1,#1              @ r1 = particleCount/4 + 1 passes

  ldr r2,=glParticles
  ldr r3,=particles
  mov r12,#16               @ one q register = 16 bytes
.LparticlePosUpdateLoopNEON:

  vld1.32 {q0},[r2]
  vld1.32 {q1},[r3],r12
  vadd.f32 q0,q0,q1         @ gl += particle
  vst1.32 {q0},[r2],r12

  vld1.32 {q2},[r2]
  vld1.32 {q3},[r3],r12
  vadd.f32 q2,q2,q3
  vst1.32 {q2},[r2],r12

  vld1.32 {q8},[r2]
  vld1.32 {q9},[r3],r12
  vadd.f32 q8,q8,q9
  vst1.32 {q8},[r2],r12

  vld1.32 {q10},[r2]
  vld1.32 {q11},[r3],r12
  vadd.f32 q10,q10,q11
  vst1.32 {q10},[r2],r12

  subs r1,r1,#1
  bne .LparticlePosUpdateLoopNEON
  bx lr                     @ interworking-safe return


@-----------------------------------------------------------------------
@ sparticlePosUpdateNEON
@
@ Takes no register arguments; works on the external symbols
@ sparticleCount, sparticleVV, glSparticles and sparticles.
@ sparticleVV is read as four consecutive 16-byte vectors VV[0..3].
@ For every 16-byte vector i (four 32-bit floats) that is processed:
@     glSparticles[i] += sparticles[i]
@     sparticles[i]   += VV[i % 4]
@ Four vectors are handled per pass and the loop runs
@ (sparticleCount >> 2) + 1 times, so it always runs at least once and
@ processes one to four vectors more than the value of sparticleCount.
@ NOTE(review): presumably both arrays are padded for this - confirm.
@
@ Regs:  r1 = passes left, r2 -> glSparticles, r3 -> sparticles
@        (r3 is first used to walk sparticleVV), r12 = 16 (stride),
@        q8-q11 = VV[0..3]
@ Clobb: r1-r3, r12, q0-q3, q8-q15, flags
@
@ Only q0-q3 and q8-q15 are used as vector registers: q4-q7 (d8-d15)
@ are callee-saved under the AAPCS and must not be changed without
@ being saved and restored.
@-----------------------------------------------------------------------
sparticlePosUpdateNEON:
  ldr r3,=sparticleCount
  ldr r1,[r3]
  lsr r1,r1,#2
  add r1,r1,#1              @ r1 = sparticleCount/4 + 1 passes

  mov r12,#16               @ one q register = 16 bytes
  ldr r3,=sparticleVV
  vld1.32 { q8},[r3],r12    @ q8..q11 = VV[0..3], constant for the loop
  vld1.32 { q9},[r3],r12
  vld1.32 {q10},[r3],r12
  vld1.32 {q11},[r3],r12

  ldr r2,=glSparticles
  ldr r3,=sparticles
.LsparticlePosUpdateLoopNEON:

  vld1.32 {q0},[r2]
  vld1.32 {q1},[r3]
  vadd.f32 q0,q0,q1         @ gl += sparticle
  vadd.f32 q1,q8,q1         @ sparticle += VV[0]
  vst1.32 {q0},[r2],r12
  vst1.32 {q1},[r3],r12

  vld1.32 {q2},[r2]
  vld1.32 {q3},[r3]
  vadd.f32 q2,q2,q3
  vadd.f32 q3,q9,q3         @ sparticle += VV[1]
  vst1.32 {q2},[r2],r12
  vst1.32 {q3},[r3],r12

  vld1.32 {q12},[r2]
  vld1.32 {q13},[r3]
  vadd.f32 q12,q12,q13
  vadd.f32 q13,q10,q13      @ sparticle += VV[2]
  vst1.32 {q12},[r2],r12
  vst1.32 {q13},[r3],r12

  vld1.32 {q14},[r2]
  vld1.32 {q15},[r3]
  vadd.f32 q14,q14,q15
  vadd.f32 q15,q11,q15      @ sparticle += VV[3]
  vst1.32 {q14},[r2],r12
  vst1.32 {q15},[r3],r12

  subs r1,r1,#1
  bne .LsparticlePosUpdateLoopNEON
  bx lr                     @ interworking-safe return