// blob: ee4a8e9c76f6829ab0101a10f7dee16e01720954 [file] [log] [blame] [edit]
// RUN: %clang++ -mllvm -force-vector-width=1 -ffast-math -fno-unroll-loops -fno-vectorize -fno-slp-vectorize -fno-exceptions -O3 %s -S -emit-llvm -o - | %opt - %OPloadEnzyme %enzyme -S | %lli -
// RUN: %clang++ -fno-unroll-loops -fno-vectorize -fno-slp-vectorize -fno-exceptions -O2 %s -S -emit-llvm -o - | %opt - %OPloadEnzyme %enzyme -S | %lli -
// RUN: %clang++ -fno-unroll-loops -fno-vectorize -fno-slp-vectorize -fno-exceptions -O1 %s -S -emit-llvm -o - | %opt - %OPloadEnzyme %enzyme -S | %lli -
// RUN: %clang++ -fno-unroll-loops -fno-vectorize -fno-slp-vectorize -fno-exceptions %O0TBAA %s -S -emit-llvm -o - | %opt - %OPloadEnzyme %enzyme -S | %lli -
// RUN: %clang++ -fno-unroll-loops -fno-vectorize -fno-slp-vectorize -fno-exceptions -O3 %s -S -emit-llvm -o - | %opt - %OPloadEnzyme %enzyme -enzyme-inline=1 -S | %lli -
// RUN: %clang++ -fno-unroll-loops -fno-vectorize -fno-slp-vectorize -fno-exceptions -O2 %s -S -emit-llvm -o - | %opt - %OPloadEnzyme %enzyme -enzyme-inline=1 -S | %lli -
// RUN: %clang++ -fno-unroll-loops -fno-vectorize -fno-slp-vectorize -fno-exceptions -O1 %s -S -emit-llvm -o - | %opt - %OPloadEnzyme %enzyme -enzyme-inline=1 -S | %lli -
// TODO: %clang++ -fno-unroll-loops -fno-vectorize -fno-slp-vectorize -fno-exceptions %O0TBAA %s -S -emit-llvm -o - | %opt - %OPloadEnzyme %enzyme -enzyme-inline=1 -S | %lli -
#define EIGEN_NO_AUTOMATIC_RESIZING 1
#define EIGEN_DONT_ALIGN 1
#define EIGEN_NO_DEBUG 1
#define EIGEN_UNROLLING_LIMIT 0
#define EIGEN_DONT_VECTORIZE 1
#include "../test_utils.h"
#include <eigen3/Eigen/Dense>
#include <math.h>
#include <stdio.h>
#include <stdlib.h>
#include <sys/time.h>
#include <stdlib.h>
#include <math.h>
#include <inttypes.h>
#include <stdlib.h>
#include <string.h>
using Eigen::MatrixXd;
using Eigen::Matrix;
using Eigen::VectorXd;
// Compile-time dimensions of every Matrix<double, IN, OUT> used in this test.
// matvec multiplies an IN x OUT matrix by itself, so IN and OUT must be equal
// for that product to be well-formed. NUM has no use in the visible code.
constexpr size_t IN = 4, OUT = 4, NUM = 5;
// Declaration of the autodiff entry point with C linkage. No definition is
// provided in this file; the RUN lines pipe the IR through the Enzyme pass,
// which is presumably what resolves calls to this symbol.
//
// As used by main below:
//   - the first argument is the function to differentiate, passed as void*;
//   - W / M are the primal inputs;
//   - Wp / Mp are zero-initialized before the call and are expected to hold
//     the gradients with respect to W and M afterwards (main asserts on their
//     contents), even though they are declared here as pointers to const.
extern "C" {
extern double __enzyme_autodiff(void*, const Matrix<double, IN, OUT>* __restrict W, const Matrix<double, IN, OUT>* __restrict Wp, const Matrix<double, IN, OUT>* __restrict M, const Matrix<double, IN, OUT>* __restrict Mp);
}
// Function under differentiation.
//
// Despite the name, this is not a matrix-vector product: it forms the
// element-wise difference D = *W - *M and returns the sum of all entries of
// the matrix-matrix product D * D.
//
// Marked noinline so it stays a separate function; presumably this keeps the
// callee intact for the Enzyme pass at the higher optimization levels used in
// the RUN lines.
__attribute__((noinline))
static double matvec(const Matrix<double, IN, OUT>* __restrict W, const Matrix<double, IN, OUT>* __restrict M) {
// Materialize the difference into a concrete matrix before multiplying.
Matrix<double, IN, OUT> diff = *W-*M;
// operator* on two Eigen matrices is the matrix product, not element-wise.
return (diff*diff).sum();
}
// Test driver: differentiates matvec at W = 1 and M = 2 (all entries) and
// checks the gradients written into Wp and Mp.
//
// With D = W - M (every entry -1) and f = sum(D * D):
//   df/dW(i, o) = (sum of row o of D) + (sum of column i of D) = -4 + -4 = -8
//   df/dM(i, o) = -df/dW(i, o)                                 = +8
// which are the values asserted below.
int main(int argc, char** argv) {
  // Loop bounds as int: avoids comparing a signed index against the size_t
  // constants and keeps the indices compatible with the %d conversions.
  constexpr int rows = static_cast<int>(IN);
  constexpr int cols = static_cast<int>(OUT);

  Matrix<double, IN, OUT> W(IN, OUT);
  Matrix<double, IN, OUT> Wp(IN, OUT);
  Matrix<double, IN, OUT> M(IN, OUT);
  Matrix<double, IN, OUT> Mp(IN, OUT);

  // Primal inputs.
  W = Eigen::Matrix<double, IN, OUT>::Constant(IN, OUT, 1.0);
  M = Eigen::Matrix<double, IN, OUT>::Constant(IN, OUT, 2.0);

  // Gradient buffers start at zero so the values checked below come solely
  // from the autodiff call.
  Wp = Eigen::Matrix<double, IN, OUT>::Constant(IN, OUT, 0.0);
  Mp = Eigen::Matrix<double, IN, OUT>::Constant(IN, OUT, 0.0);

  __enzyme_autodiff((void*)matvec, &W, &Wp, &M, &Mp);

  // Gradient with respect to W.
  for (int o = 0; o < cols; o++) {
    for (int i = 0; i < rows; i++) {
      APPROX_EQ( Wp(i, o), -8., 1e-10);
      // Labels follow the (i, o) argument order; they were previously swapped.
      fprintf(stderr, "Wp(i=%d, o=%d)=%f\n", i, o, Wp(i, o));
    }
  }

  // Gradient with respect to M.
  for (int o = 0; o < cols; o++) {
    for (int i = 0; i < rows; i++) {
      APPROX_EQ( Mp(i, o), 8., 1e-10);
      fprintf(stderr, "Mp(i=%d, o=%d)=%f\n", i, o, Mp(i, o));
    }
  }
}