Geant4 10.7.0
Toolkit for the simulation of the passage of particles through matter
Loading...
Searching...
No Matches
G4Exp.hh
Go to the documentation of this file.
1//
2// ********************************************************************
3// * License and Disclaimer *
4// * *
5// * The Geant4 software is copyright of the Copyright Holders of *
6// * the Geant4 Collaboration. It is provided under the terms and *
7// * conditions of the Geant4 Software License, included in the file *
8// * LICENSE and available at http://cern.ch/geant4/license . These *
9// * include a list of copyright holders. *
10// * *
11// * Neither the authors of this software system, nor their employing *
12// * institutes,nor the agencies providing financial support for this *
13// * work make any representation or warranty, express or implied, *
14// * regarding this software system or assume any liability for its *
15// * use. Please see the license in the file LICENSE and URL above *
16// * for the full disclaimer and the limitation of liability. *
17// * *
18// * This code implementation is the result of the scientific and *
19// * technical work of the GEANT4 collaboration. *
20// * By using, copying, modifying or distributing the software (or *
21// * any work based on the software) you agree to acknowledge its *
22// * use in resulting scientific publications, and indicate your *
23// * acceptance of all terms of the Geant4 Software license. *
24// ********************************************************************
25//
26// G4Exp
27//
28// Class description:
29//
30// The basic idea is to exploit Pade polynomials.
31// A lot of ideas were inspired by the cephes math library
32// (by Stephen L. Moshier [email protected]) as well as actual code.
33// The Cephes library can be found here: http://www.netlib.org/cephes/
34// Code and algorithms for G4Exp have been extracted and adapted for Geant4
35// from the original implementation in the VDT mathematical library
36// (https://svnweb.cern.ch/trac/vdt), version 0.3.7.
37
38// Original implementation created on: Jun 23, 2012
39// Authors: Danilo Piparo, Thomas Hauth, Vincenzo Innocente
40//
41// --------------------------------------------------------------------
42/*
43 * VDT is free software: you can redistribute it and/or modify
44 * it under the terms of the GNU Lesser Public License as published by
45 * the Free Software Foundation, either version 3 of the License, or
46 * (at your option) any later version.
47 *
48 * This program is distributed in the hope that it will be useful,
49 * but WITHOUT ANY WARRANTY; without even the implied warranty of
50 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
51 * GNU Lesser Public License for more details.
52 *
53 * You should have received a copy of the GNU Lesser Public License
54 * along with this program. If not, see <http://www.gnu.org/licenses/>.
55 */
56// --------------------------------------------------------------------
57#ifndef G4Exp_hh
58#define G4Exp_hh 1
59
60#ifdef WIN32
61
62# define G4Exp std::exp
63
64#else
65
66# include "G4Types.hh"
67# include <limits>
68# include <stdint.h>
69
70namespace G4ExpConsts
71{
72 const G4double EXP_LIMIT = 708;
73
74 const G4double PX1exp = 1.26177193074810590878E-4;
75 const G4double PX2exp = 3.02994407707441961300E-2;
76 const G4double PX3exp = 9.99999999999999999910E-1;
77 const G4double QX1exp = 3.00198505138664455042E-6;
78 const G4double QX2exp = 2.52448340349684104192E-3;
79 const G4double QX3exp = 2.27265548208155028766E-1;
80 const G4double QX4exp = 2.00000000000000000009E0;
81
82 const G4double LOG2E = 1.4426950408889634073599; // 1/log(2)
83
84 const G4float MAXLOGF = 88.72283905206835f;
85 const G4float MINLOGF = -88.f;
86
87 const G4float C1F = 0.693359375f;
88 const G4float C2F = -2.12194440e-4f;
89
90 const G4float PX1expf = 1.9875691500E-4f;
91 const G4float PX2expf = 1.3981999507E-3f;
92 const G4float PX3expf = 8.3334519073E-3f;
93 const G4float PX4expf = 4.1665795894E-2f;
94 const G4float PX5expf = 1.6666665459E-1f;
95 const G4float PX6expf = 5.0000001201E-1f;
96
97 const G4float LOG2EF = 1.44269504088896341f;
98
99 //----------------------------------------------------------------------------
100 // Used to switch between different type of interpretations of the data
101 // (64 bits)
102 //
104 {
106 ieee754(G4double thed) { d = thed; };
107 ieee754(uint64_t thell) { ll = thell; };
108 ieee754(G4float thef) { f[0] = thef; };
109 ieee754(uint32_t thei) { i[0] = thei; };
112 uint32_t i[2];
113 uint64_t ll;
114 uint16_t s[4];
115 };
116
117 //----------------------------------------------------------------------------
118 // Converts an unsigned long long to a double
119 //
120 inline G4double uint642dp(uint64_t ll)
121 {
122 ieee754 tmp;
123 tmp.ll = ll;
124 return tmp.d;
125 }
126
127 //----------------------------------------------------------------------------
128 // Converts an int to a float
129 //
131 {
132 ieee754 tmp;
133 tmp.i[0] = x;
134 return tmp.f[0];
135 }
136
137 //----------------------------------------------------------------------------
138 // Converts a float to an int
139 //
140 inline uint32_t sp2uint32(G4float x)
141 {
142 ieee754 tmp;
143 tmp.f[0] = x;
144 return tmp.i[0];
145 }
146
147 //----------------------------------------------------------------------------
148 /**
149 * A vectorisable floor implementation, not only triggered by fast-math.
150 * These functions do not distinguish between -0.0 and 0.0, so are not IEC6509
151 * compliant for argument -0.0
152 **/
153 inline G4double fpfloor(const G4double x)
154 {
155 // no problem since exp is defined between -708 and 708. Int is enough for
156 // it!
157 int32_t ret = int32_t(x);
158 ret -= (sp2uint32(x) >> 31);
159 return ret;
160 }
161
162 //----------------------------------------------------------------------------
163 /**
164 * A vectorisable floor implementation, not only triggered by fast-math.
165 * These functions do not distinguish between -0.0 and 0.0, so are not IEC6509
166 * compliant for argument -0.0
167 **/
168 inline G4float fpfloor(const G4float x)
169 {
170 int32_t ret = int32_t(x);
171 ret -= (sp2uint32(x) >> 31);
172 return ret;
173 }
174} // namespace G4ExpConsts
175
176// Exp double precision --------------------------------------------------------
177
178/// Exponential Function double precision
179inline G4double G4Exp(G4double initial_x)
180{
181 G4double x = initial_x;
183
184 const int32_t n = int32_t(px);
185
186 x -= px * 6.93145751953125E-1;
187 x -= px * 1.42860682030941723212E-6;
188
189 const G4double xx = x * x;
190
191 // px = x * P(x**2).
193 px *= xx;
195 px *= xx;
197 px *= x;
198
199 // Evaluate Q(x**2).
201 qx *= xx;
203 qx *= xx;
205 qx *= xx;
207
208 // e**x = 1 + 2x P(x**2)/( Q(x**2) - P(x**2) )
209 x = px / (qx - px);
210 x = 1.0 + 2.0 * x;
211
212 // Build 2^n in double.
213 x *= G4ExpConsts::uint642dp((((uint64_t) n) + 1023) << 52);
214
215 if(initial_x > G4ExpConsts::EXP_LIMIT)
216 x = std::numeric_limits<G4double>::infinity();
217 if(initial_x < -G4ExpConsts::EXP_LIMIT)
218 x = 0.;
219
220 return x;
221}
222
223// Exp single precision --------------------------------------------------------
224
225/// Exponential Function single precision
226inline G4float G4Expf(G4float initial_x)
227{
228 G4float x = initial_x;
229
230 G4float z =
232 0.5f); /* std::floor() truncates toward -infinity. */
233
234 x -= z * G4ExpConsts::C1F;
235 x -= z * G4ExpConsts::C2F;
236 const int32_t n = int32_t(z);
237
238 const G4float x2 = x * x;
239
240 z = x * G4ExpConsts::PX1expf;
242 z *= x;
244 z *= x;
246 z *= x;
248 z *= x;
250 z *= x2;
251 z += x + 1.0f;
252
253 /* multiply by power of 2 */
254 z *= G4ExpConsts::uint322sp((n + 0x7f) << 23);
255
256 if(initial_x > G4ExpConsts::MAXLOGF)
257 z = std::numeric_limits<G4float>::infinity();
258 if(initial_x < G4ExpConsts::MINLOGF)
259 z = 0.f;
260
261 return z;
262}
263
264//------------------------------------------------------------------------------
265
266void expv(const uint32_t size, G4double const* __restrict__ iarray,
267 G4double* __restrict__ oarray);
268void G4Expv(const uint32_t size, G4double const* __restrict__ iarray,
269 G4double* __restrict__ oarray);
270void expfv(const uint32_t size, G4float const* __restrict__ iarray,
271 G4float* __restrict__ oarray);
272void G4Expfv(const uint32_t size, G4float const* __restrict__ iarray,
273 G4float* __restrict__ oarray);
274
275#endif /* WIN32 */
276
277#endif
void expv(const uint32_t size, G4double const *__restrict__ iarray, G4double *__restrict__ oarray)
void G4Expfv(const uint32_t size, G4float const *__restrict__ iarray, G4float *__restrict__ oarray)
G4double G4Exp(G4double initial_x)
Exponential Function double precision.
Definition: G4Exp.hh:179
void expfv(const uint32_t size, G4float const *__restrict__ iarray, G4float *__restrict__ oarray)
G4float G4Expf(G4float initial_x)
Exponential Function single precision.
Definition: G4Exp.hh:226
void G4Expv(const uint32_t size, G4double const *__restrict__ iarray, G4double *__restrict__ oarray)
float G4float
Definition: G4Types.hh:84
double G4double
Definition: G4Types.hh:83
int G4int
Definition: G4Types.hh:85
const G4double QX3exp
Definition: G4Exp.hh:79
const G4float C1F
Definition: G4Exp.hh:87
const G4double QX4exp
Definition: G4Exp.hh:80
const G4float PX1expf
Definition: G4Exp.hh:90
G4double uint642dp(uint64_t ll)
Definition: G4Exp.hh:120
const G4double PX3exp
Definition: G4Exp.hh:76
const G4float LOG2EF
Definition: G4Exp.hh:97
const G4double EXP_LIMIT
Definition: G4Exp.hh:72
G4double fpfloor(const G4double x)
Definition: G4Exp.hh:153
const G4float PX6expf
Definition: G4Exp.hh:95
G4float uint322sp(G4int x)
Definition: G4Exp.hh:130
const G4double PX1exp
Definition: G4Exp.hh:74
const G4double QX1exp
Definition: G4Exp.hh:77
const G4float PX4expf
Definition: G4Exp.hh:93
const G4float MINLOGF
Definition: G4Exp.hh:85
const G4float PX3expf
Definition: G4Exp.hh:92
const G4float MAXLOGF
Definition: G4Exp.hh:84
const G4float PX5expf
Definition: G4Exp.hh:94
const G4double PX2exp
Definition: G4Exp.hh:75
const G4double LOG2E
Definition: G4Exp.hh:82
const G4float PX2expf
Definition: G4Exp.hh:91
uint32_t sp2uint32(G4float x)
Definition: G4Exp.hh:140
const G4double QX2exp
Definition: G4Exp.hh:78
const G4float C2F
Definition: G4Exp.hh:88
ieee754(G4double thed)
Definition: G4Exp.hh:106
uint16_t s[4]
Definition: G4Exp.hh:114
uint32_t i[2]
Definition: G4Exp.hh:112
ieee754(uint64_t thell)
Definition: G4Exp.hh:107
ieee754(uint32_t thei)
Definition: G4Exp.hh:109
G4float f[2]
Definition: G4Exp.hh:111
ieee754(G4float thef)
Definition: G4Exp.hh:108