37 #include "TinyFadET/tfad.h" 48 void FAD::error(
const char *msg) {
49 std::cout << msg << std::endl;
53 double xi[3], xj[3], pa[4],
f[3], delr[3];
59 T delr0 = xi[0]-xj[0];
60 T delr1 = xi[1]-xj[1];
61 T delr2 = xi[2]-xj[2];
62 return delr0*delr0 + delr1*delr1 + delr2*delr2;
68 delr[0] = xi[0]-xj[0];
69 delr[1] = xi[1]-xj[1];
70 delr[2] = xi[2]-xj[2];
71 return delr[0]*delr[0] + delr[1]*delr[1] + delr[2]*delr[2];
76 lj(
const T xi[],
const double xj[],
T& energy) {
79 T delr_6 = delr_2*delr_2*delr_2;
80 energy = (pa[1]*delr_6 - pa[2])*delr_6 - pa[3];
84 lj_and_grad(
const double xi[],
const double xj[],
double& energy,
87 double delr_2 = 1.0/delr2;
88 double delr_6 = delr_2*delr_2*delr_2;
89 energy = (pa[1]*delr_6 - pa[2])*delr_6 - pa[3];
90 double tmp = (-12.0*pa[1]*delr_6 - 6.0*pa[2])*delr_6*delr_2;
96 template <
typename FadType>
103 for (
int i=0; i<3; i++) {
104 xi_fad[i] =
FadType(3, i, xi[i]);
108 for (
int j=0; j<nloop; j++) {
110 lj(xi_fad, xj, energy);
112 for (
int i=0; i<3; i++)
113 f[i] += -energy.fastAccessDx(i);
124 double energy, ff[3];
127 for (
int j=0; j<nloop; j++) {
131 for (
int i=0; i<3; i++)
140 int main(
int argc,
char* argv[]) {
150 clp.
setDocString(
"This program tests the speed of various forward mode AD implementations for a single multiplication operation");
152 clp.
setOption(
"nloop", &nloop,
"Number of loops");
156 parseReturn= clp.
parse(argc, argv);
165 std::cout.setf(std::ios::scientific);
166 std::cout.precision(p);
167 std::cout <<
"Times (sec) nloop = " << nloop <<
": " << std::endl;
170 for (
int i=0; i<3; i++) {
178 std::cout <<
"Analytic: " << std::setw(w) << ta << std::endl;
180 t = do_time< FAD::TFad<3,double> >(nloop);
181 std::cout <<
"TFad: " << std::setw(w) << t <<
"\t" << std::setw(w) << t/ta << std::endl;
183 t = do_time< FAD::Fad<double> >(nloop);
184 std::cout <<
"Fad: " << std::setw(w) << t <<
"\t" << std::setw(w) << t/ta << std::endl;
186 t = do_time< Sacado::Fad::SFad<double,3> >(nloop);
187 std::cout <<
"SFad: " << std::setw(w) << t <<
"\t" << std::setw(w) << t/ta << std::endl;
189 t = do_time< Sacado::Fad::SLFad<double,3> >(nloop);
190 std::cout <<
"SLFad: " << std::setw(w) << t <<
"\t" << std::setw(w) << t/ta << std::endl;
192 t = do_time< Sacado::Fad::DFad<double> >(nloop);
193 std::cout <<
"DFad: " << std::setw(w) << t <<
"\t" << std::setw(w) << t/ta << std::endl;
195 t = do_time< Sacado::Fad::DMFad<double> >(nloop);
196 std::cout <<
"DMFad: " << std::setw(w) << t <<
"\t" << std::setw(w) << t/ta << std::endl;
198 t = do_time< Sacado::ELRFad::SFad<double,3> >(nloop);
199 std::cout <<
"ELRSFad: " << std::setw(w) << t <<
"\t" << std::setw(w) << t/ta << std::endl;
201 t = do_time< Sacado::ELRFad::SLFad<double,3> >(nloop);
202 std::cout <<
"ELRSLFad: " << std::setw(w) << t <<
"\t" << std::setw(w) << t/ta << std::endl;
204 t = do_time< Sacado::ELRFad::DFad<double> >(nloop);
205 std::cout <<
"ELRDFad: " << std::setw(w) << t <<
"\t" << std::setw(w) << t/ta << std::endl;
207 t = do_time< Sacado::CacheFad::DFad<double> >(nloop);
208 std::cout <<
"CacheFad: " << std::setw(w) << t <<
"\t" << std::setw(w) << t/ta << std::endl;
210 t = do_time< Sacado::Fad::DVFad<double> >(nloop);
211 std::cout <<
"DVFad: " << std::setw(w) << t <<
"\t" << std::setw(w) << t/ta << std::endl;
214 catch (std::exception& e) {
215 std::cout << e.what() << std::endl;
218 catch (
const char *s) {
219 std::cout << s << std::endl;
223 std::cout <<
"Caught unknown exception!" << std::endl;
MemPool * getMemoryPool(unsigned int dim)
Get memory pool for supplied dimension dim.
Sacado::Fad::DFad< double > FadType
double do_time_analytic(int nloop)
ScalarT number()
Get random number.
double do_time(int nloop)
void start(bool reset=false)
int main(int argc, char *argv[])
void setOption(const char option_true[], const char option_false[], bool *option_val, const char documentation[]=NULL)
Derivative array storage class using dynamic memory allocation.
EParseCommandLineReturn parse(int argc, char *argv[], std::ostream *errout=&std::cerr) const
double totalElapsedTime(bool readCurrentTime=false) const
void lj_and_grad(const double xi[], const double xj[], double &energy, double f[])
void setDocString(const char doc_string[])
Forward-mode AD class using dynamic memory allocation and expression templates.
void lj(const T xi[], const double xj[], T &energy)
T vec3_distsq(const T xi[], const double xj[])