blob: 4076978d1af673671fd57667debfc90e3b669256 [file] [log] [blame] [edit]
// RUN: %clang++ -mllvm -force-vector-width=1 -ffast-math -fno-unroll-loops -fno-vectorize -fno-slp-vectorize -fno-exceptions -O3 %s -S -emit-llvm -o - | %opt - %OPloadEnzyme %enzyme -enzyme-loose-types -S | %lli -
// RUN: %clang++ -fno-unroll-loops -fno-vectorize -fno-slp-vectorize -fno-exceptions -O2 %s -S -emit-llvm -o - | %opt - %OPloadEnzyme %enzyme -enzyme-loose-types -S | %lli -
// RUN: %clang++ -fno-unroll-loops -fno-vectorize -fno-slp-vectorize -fno-exceptions -O1 %s -S -emit-llvm -o - | %opt - %OPloadEnzyme %enzyme -enzyme-loose-types -S | %lli -
// RUN: %clang++ -fno-unroll-loops -fno-vectorize -fno-slp-vectorize -fno-exceptions %O0TBAA %s -S -emit-llvm -o - | %opt - %OPloadEnzyme %enzyme -S | %lli -
// RUN: %clang++ -fno-unroll-loops -fno-vectorize -fno-slp-vectorize -fno-exceptions -O3 %s -S -emit-llvm -o - | %opt - %OPloadEnzyme %enzyme -enzyme-inline=1 -S | %lli -
// RUN: %clang++ -fno-unroll-loops -fno-vectorize -fno-slp-vectorize -fno-exceptions -O2 %s -S -emit-llvm -o - | %opt - %OPloadEnzyme %enzyme -enzyme-inline=1 -S | %lli -
// RUN: %clang++ -fno-unroll-loops -fno-vectorize -fno-slp-vectorize -fno-exceptions -O1 %s -S -emit-llvm -o - | %opt - %OPloadEnzyme %enzyme -enzyme-inline=1 -S | %lli -
// TODO: %clang++ -fno-unroll-loops -fno-vectorize -fno-slp-vectorize -fno-exceptions -O0 %s -S -emit-llvm -o - | %opt - %OPloadEnzyme %enzyme -enzyme-inline=1 -S | %lli -
#define EIGEN_NO_AUTOMATIC_RESIZING 1
#define EIGEN_DONT_ALIGN 1
#define EIGEN_NO_DEBUG 1
#define EIGEN_UNROLLING_LIMIT 0
#define EIGEN_DONT_VECTORIZE 1
#include "../test_utils.h"
#include <eigen3/Eigen/Dense>
#include <math.h>
#include <stdio.h>
#include <stdlib.h>
#include <sys/time.h>
#include <stdlib.h>
#include <math.h>
#include <inttypes.h>
#include <stdlib.h>
#include <string.h>
using Eigen::MatrixXd;
using Eigen::Matrix;
using Eigen::VectorXd;
constexpr size_t IN = 4, OUT = 4, NUM = 5;
extern "C" {
extern double __enzyme_autodiff(void*, const MatrixXd* __restrict W, const MatrixXd* __restrict Wp, const MatrixXd* __restrict M, const MatrixXd* __restrict Mp);
}
__attribute__((noinline))
static double matvec(const MatrixXd* __restrict W, const MatrixXd* __restrict M) {
MatrixXd diff = *W-*M;
return (diff*diff).sum();
}
int main(int argc, char** argv) {
//size_t IN = 40, OUT = 30, NUM = 50;
MatrixXd W = Eigen::MatrixXd::Constant(IN, OUT, 1.0);
MatrixXd M = Eigen::MatrixXd::Constant(IN, OUT, 2.0);
MatrixXd Wp = Eigen::MatrixXd::Constant(IN, OUT, 0.0);
MatrixXd Mp = Eigen::MatrixXd::Constant(IN, OUT, 0.0);
__enzyme_autodiff((void*)matvec, &W, &Wp, &M, &Mp);
for(int o=0; o<OUT; o++)
for(int i=0; i<IN; i++) {
APPROX_EQ( Wp(i, o), -8., 1e-10);
fprintf(stderr, "Wp(o=%d, i=%d)=%f\n", i, o, Wp(i, o));
}
for(int o=0; o<OUT; o++)
for(int i=0; i<IN; i++) {
APPROX_EQ( Mp(i, o), 8., 1e-10);
fprintf(stderr, "Mp(o=%d, i=%d)=%f\n", i, o, Mp(i, o));
}
}