Goal: Use OpenMP to evaluate different adjoint vectors at the same time.
Prerequisite: Example 2 - Custom adjoint vector evaluation
Function: Simple vector valued function
template<typename Real>
void func(
const Real* x,
size_t l,
Real* y) {
y[0] = 0.0;
y[1] = 1.0;
for(size_t i = 0; i < l; ++i) {
y[0] += x[i];
y[1] *= x[i];
}
}
Full code:
#include <codi.hpp>
#include <iostream>
#include <omp.h>
template<typename Real>
void func(
const Real* x,
size_t l,
Real* y) {
y[0] = 0.0;
y[1] = 1.0;
for(size_t i = 0; i < l; ++i) {
y[0] += x[i];
y[1] *= x[i];
}
}
int main(int nargs, char** args) {
x[0] = 1.0;
x[1] = 2.0;
x[2] = 3.0;
x[3] = 4.0;
x[4] = 5.0;
tape.setActive();
for(size_t i = 0; i < 5; ++i) {
tape.registerInput(x[i]);
}
func(x, 5, y);
tape.registerOutput(y[0]);
tape.registerOutput(y[1]);
tape.setPassive();
#pragma omp parallel num_threads(2)
{
int tid = omp_get_thread_num();
for(size_t i = 0; i < 5; ++i) {
}
}
std::cout << "Custom adjoint vector helper:" << std::endl;
std::cout << "f(1 .. 5) = (" << y[0] << ", " << y[1] << ")" << std::endl;
std::cout << "df/dx (1 .. 5) = \n" << jacobian << std::endl;
tape.reset();
}
tape.evaluate()
can not be used with OpenMP since both threads would use the internal adjoint vector of the tape concurrently.