M2-engine/docs/_s_l_p-imp_8hpp_source.html

// Copyright 2015 Anton Leykin and Mike Stillman


// Anton Leykin's code in this file is in the public domain.


#ifndef _slp_imp_hpp_

#define _slp_imp_hpp_


#include <cstdlib>

#include <algorithm>

#include <dlfcn.h>

#include "timing.hpp"


// SLEvaluator

// Sparse-matrix overload of the SLP-based constructor.
// Evaluators over sparse matrices are not supported: after binding mRing to
// the ring of `consts`, this prints a message on stderr and aborts.
template <typename RT>
SLEvaluatorConcrete<RT>::SLEvaluatorConcrete(
    SLProgram* SLP,
    M2_arrayint cPos,
    M2_arrayint vPos,
    const MutableMat<SMat<RT> >* consts /* DMat<RT>& DMat_consts */)
    : mRing(consts->getMat().ring())
{
  // None of the remaining arguments is used; silence unused-parameter
  // warnings.
  static_cast<void>(SLP);
  static_cast<void>(cPos);
  static_cast<void>(vPos);

  std::cerr
      << "SLEvaluatorConcrete constructor not defined for sparse matrices\n";
  abort();
}


// Sparse-matrix overload of the compiled-library constructor.
// Not supported: after binding mRing to the ring of `empty`, this prints a
// message on stderr and aborts.
template <typename RT>
SLEvaluatorConcrete<RT>::SLEvaluatorConcrete(
    M2_string libName,
    int nInputs,
    int nOutputs,
    const MutableMat<SMat<RT> >* empty)
    : mRing(empty->getMat().ring())
{
  // None of the remaining arguments is used; silence unused-parameter
  // warnings.
  static_cast<void>(libName);
  static_cast<void>(nInputs);
  static_cast<void>(nOutputs);

  std::cerr
      << "SLEvaluatorConcrete constructor not defined for sparse matrices\n";
  abort();
}


// Constructs an evaluator backed by a function loaded from a shared library.
//
//   libName  - path of the shared library, passed to dlopen
//   nInputs  - number of inputs the compiled function reads
//   nOutputs - number of outputs the compiled function writes
//   empty    - dense mutable matrix used only to obtain the coefficient ring
//
// The library is searched for one of two mangled symbols:
//   _Z8evaluatePKdPd                 evaluate(const double*, double*)
//   _Z8evaluatePKSt7complexIdEPS0_   evaluate(const std::complex<double>*,
//                                             std::complex<double>*)
// If the library cannot be loaded, or neither symbol is found, compiled_fn is
// left null and the problem is reported (ERROR resp. stderr).
template <typename RT>
SLEvaluatorConcrete<RT>::SLEvaluatorConcrete
(M2_string libName,
 int nInputs,
 int nOutputs,
 const MutableMat<DMat<RT> >* empty
 ): mRing(empty->getMat().ring()), isCompiled(true), nInputs(nInputs), nOutputs(nOutputs), nParams(0), parametersAndInputs(nullptr)
{
  slp = NULL;
  // Start from a well-defined "no function" state so that every failure path
  // below leaves a null pointer rather than an indeterminate one.
  compiled_fn = NULL;

  //const char* funname = "evaluate";
  const char* funnameRR = "_Z8evaluatePKdPd";
  const char* funnameCC = "_Z8evaluatePKSt7complexIdEPS0_";

  auto libName_std = string_M2_to_std(libName);
  const char* lib_name = libName_std.c_str();
  printf("loading from %s\n", lib_name);

  void* handle = dlopen(lib_name, RTLD_LAZY | RTLD_GLOBAL);
  if (handle == NULL)
    {
      ERROR("can't load library %s", lib_name);
      // Do not fall through to dlsym: a null handle is not "this library"
      // and could resolve the symbol from some other, previously loaded one.
      return;
    }

  // Try the real-valued entry point first, then the complex-valued one.
  compiled_fn = (void (*)(ElementType const*, ElementType*)) dlsym(handle, funnameRR);
  if (compiled_fn == NULL)
    compiled_fn = (void (*)(ElementType const*, ElementType*)) dlsym(handle, funnameCC);
  if (compiled_fn == NULL)
    std::cerr << "can't link function " << funnameRR << " or " << funnameCC << " from library " << lib_name << std::endl;
}


// copy constructor

// Copy constructor.
// Shares the SLProgram pointer and the compiled function pointer with `a`,
// copies every entry of `values` through the ring, and, when `a` has a
// parameter buffer, allocates a fresh buffer of nParams + nInputs elements and
// copies the first nParams entries (the parameter values) into it.
template <typename RT>
SLEvaluatorConcrete<RT>::SLEvaluatorConcrete(const SLEvaluatorConcrete<RT>& a)
  : SLEvaluator(a),
    mRing(a.ring()),
    isCompiled(a.isCompiled),
    nInputs(a.nInputs),
    nOutputs(a.nOutputs),
    values(a.values.size()),
    compiled_fn(a.compiled_fn),
    nParams(a.nParams)
{
  slp = a.slp;
  varsPos = a.varsPos;

  // `values` was sized to match a.values above; initialize each slot as a
  // copy of the corresponding source element.
  auto source = a.values.begin();
  for (auto& target : values)
    {
      ring().init_set(target, *source);
      ++source;
    }
  // std::cout << "SLEvaluatorConcrete: copy constructor for " << this << std::endl;

  parametersAndInputs = nullptr;
  if (a.parametersAndInputs != nullptr)
    {
      parametersAndInputs = new ElementType[nParams + nInputs];
      std::copy(a.parametersAndInputs,
                a.parametersAndInputs + nParams,
                parametersAndInputs);
    }
}


// Destructor.
// An interpreted evaluator clears every ring element stored in `values`;
// a compiled one releases its parameter/input buffer. The shared library
// handle is not closed here.
template <typename RT>
SLEvaluatorConcrete<RT>::~SLEvaluatorConcrete()
{
  // std::cout << "~SLEvaluatorConcrete: " << this << std::endl
  if (not isCompiled)
    {
      for (auto it = values.begin(); it != values.end(); ++it)
        ring().clear(*it);
      return;
    }
  // dlclose???
  delete[] parametersAndInputs;  // delete[] on a null pointer is a no-op
}


// Constructs an interpreted evaluator for the straight-line program `SLP`.
//
//   SLP    - the program; stored, not copied
//   cPos   - positions of the constants, relative to slp->inputCounter
//   vPos   - positions of the variables, relative to slp->inputCounter
//   consts - dense matrix whose row 0 holds the values of the constants,
//            in the order given by cPos
template <typename RT>
SLEvaluatorConcrete<RT>::SLEvaluatorConcrete
(SLProgram* SLP,
 M2_arrayint cPos,
 M2_arrayint vPos,
 const MutableMat<DMat<RT> >* consts /* DMat<RT>& DMat_consts */
 ): mRing(consts->getMat().ring()), isCompiled(false), compiled_fn(NULL), nParams(0), parametersAndInputs(nullptr)
{
  slp = SLP;

  // Record where each variable lives in `values`.
  for (int k = 0; k < vPos->len; k++)
    {
      varsPos.push_back(slp->inputCounter + vPos->array[k]);
    }

  // One slot per input and per node of the program, all ring-initialized.
  values.resize(slp->inputCounter + slp->mNodes.size());
  for (auto& slot : values) ring().init(slot);

  // Store the constants in their slots.
  const auto& constMatrix = consts->getMat();
  for (int k = 0; k < cPos->len; k++)
    {
      ring().set(values[slp->inputCounter + cPos->array[k]],
                 constMatrix.entry(0, k));
    }
  // std::cout << "SLEvaluatorConcrete(MutableMat): " << this << std::endl;

  nInputs = varsPos.size();
  nOutputs = slp->mOutputPositions.size();
}


// Type-erased entry point for specialization.
// Requires `parameters` to be a dense mutable matrix over this evaluator's
// ring type and forwards to the typed overload; otherwise throws
// exc::engine_error.
template <typename RT>
SLEvaluator* SLEvaluatorConcrete<RT>::specialize(
    const MutableMatrix* parameters) const
{
  // std::cout << "SLEvaluatorConcrete::specialize:" << this << std::endl;
  if (auto dense = dynamic_cast<const MutableMat<DMat<RT> >*>(parameters))
    {
      return specialize(dense);
    }
  throw exc::engine_error("specialize: expected a dense mutable matrix");
}


// Returns a new evaluator (a copy of this one, allocated with `new`) in which
// the first n_rows() inputs are fixed to the entries of the one-column matrix
// `parameters`.
// Throws exc::engine_error if `parameters` is not a single column or has more
// rows than this evaluator has inputs.
template <typename RT>
SLEvaluator* SLEvaluatorConcrete<RT>::specialize(
    const MutableMat<DMat<RT> >* parameters) const
{
  const size_t nNewParams = parameters->n_rows();
  const bool isSingleColumn = (parameters->n_cols() == 1);
  if (not isSingleColumn or nNewParams > nInputs)
    throw exc::engine_error("1-column matrix expected; or #parameters > #vars");

  auto* e = new SLEvaluatorConcrete<RT>(*this);
  const auto& paramValues = parameters->getMat();

  if (not isCompiled)
    {
      // Interpreted: write the parameter values into the slots of the first
      // nNewParams variables, then stop treating those slots as inputs.
      for (size_t k = 0; k < nNewParams; ++k)
        ring().set(e->values[varsPos[k]], paramValues.entry(k, 0));
      e->varsPos.erase(e->varsPos.begin(), e->varsPos.begin() + nNewParams);
      e->nInputs = e->varsPos.size();
      e->nParams = nParams + nNewParams;
      return e;
    }

  // Compiled: the function takes one array laid out as
  // [old parameters | new parameters | remaining inputs].
  e->nParams = nParams + nNewParams;
  e->nInputs -= nNewParams;
  delete[] e->parametersAndInputs;
  e->parametersAndInputs = new ElementType[e->nParams + e->nInputs];
  std::copy(parametersAndInputs,
            parametersAndInputs + nParams,
            e->parametersAndInputs);  // old parameters values
  for (size_t k = 0; k < nNewParams; ++k)
    ring().set(e->parametersAndInputs[nParams + k], paramValues.entry(k, 0));
  return e;
}


// Evaluates the gate at the current position of the node iterator and stores
// the result in the value slot vIt points at.
// Consumes one entry of nIt, the gate's operands from inputPositionsIt and,
// for product/sum/determinant gates, one entry of numInputsIt. Operand
// positions are offsets relative to vIt. Aborts on an unknown gate type.
template <typename RT>
void SLEvaluatorConcrete<RT>::computeNextNode()
{
  ElementType& result = *vIt;

  // Returns the next operand and advances the operand-position iterator.
  auto nextOperand = [this]() -> ElementType& {
    return *(vIt + (*inputPositionsIt++));
  };

  const auto gate = *nIt++;
  if (gate == SLProgram::MProduct)
    {
      // product of all operands, starting from 1
      const auto arity = *numInputsIt++;
      ring().set_from_long(result, 1);
      for (int k = 0; k < arity; k++) ring().mult(result, result, nextOperand());
    }
  else if (gate == SLProgram::MSum)
    {
      // sum of all operands, starting from 0
      const auto arity = *numInputsIt++;
      ring().set_zero(result);
      for (int k = 0; k < arity; k++) ring().add(result, result, nextOperand());
    }
  else if (gate == SLProgram::Det)
    {
      // the operands are the entries of a square matrix, row by row
      const int size = static_cast<int>(sqrt(*numInputsIt++));
      DMat<RT> mat(ring(), size, size);
      for (int row = 0; row < size; row++)
        for (int col = 0; col < size; col++)
          ring().set(mat.entry(row, col), nextOperand());
      DMatLinAlg<RT>(mat).determinant(result);
    }
  else if (gate == SLProgram::Divide)
    {
      // first operand divided by second operand
      ring().set(result, nextOperand());
      ring().divide(result, result, nextOperand());
    }
  else
    {
      std::cerr << "unknown node type\n";
      abort();
    }
}


// Type-erased evaluation entry point.
// Checks that both matrices are dense mutable matrices over this evaluator's
// ring, then forwards to the typed overload. On a failed check, records an
// error with ERROR and returns false.
template <typename RT>
bool SLEvaluatorConcrete<RT>::evaluate(const MutableMatrix* inputs,
                                       MutableMatrix* outputs)
{
  const auto* inp = dynamic_cast<const MutableMat<DMat<RT> >*>(inputs);
  auto* out = dynamic_cast<MutableMat<DMat<RT> >*>(outputs);

  // Both arguments must be dense matrices of the right element type ...
  if (inp == nullptr)
    {
      ERROR("inputs: expected a dense mutable matrix");
      return false;
    }
  if (out == nullptr)
    {
      ERROR("outputs: expected a dense mutable matrix");
      return false;
    }

  // ... and must live in the very same ring object as this evaluator.
  const bool inputsInRing = (&ring() == &inp->getMat().ring());
  if (not inputsInRing)
    {
      ERROR("inputs are in a different ring");
      return false;
    }
  const bool outputsInRing = (&ring() == &out->getMat().ring());
  if (not outputsInRing)
    {
      ERROR("outputs are in a different ring");
      return false;
    }

  return evaluate(inp->getMat(), out->getMat());
}


// Evaluates the program (or the compiled function) at `inputs` and writes the
// results into `outputs`.
//
//   inputs  - dense matrix with exactly nInputs entries, read row by row
//   outputs - dense matrix with exactly nOutputs entries, filled row by row
//
// Returns false (after recording an error with ERROR) if an entry count does
// not match or if this is a compiled evaluator whose function could not be
// linked; returns true otherwise.
template <typename RT>
bool SLEvaluatorConcrete<RT>::evaluate(const DMat<RT>& inputs,
                                       DMat<RT>& outputs)
{
  if (nInputs != inputs.numRows() * inputs.numColumns()) {
    ERROR(
          "inputs: the number of inputs does not match the number of entries "
          "in the inputs matrix");
    std::cout << nInputs
              << " != " << inputs.numRows() * inputs.numColumns()
              << std::endl;
    return false;
  }
  if (nOutputs != outputs.numRows() * outputs.numColumns()) {
    ERROR(
          "outputs: the number of outputs does not match the number of entries "
          "in the outputs matrix");
    std::cout << nOutputs << " != " << outputs.numRows()
              << " * " << outputs.numColumns() << std::endl;
    return false;
  }

  if (isCompiled) {
    // The library constructor leaves compiled_fn null when the library or the
    // symbol could not be found; calling through it would crash.
    if (compiled_fn == nullptr) {
      ERROR("compiled evaluation function is not available");
      return false;
    }
    if(parametersAndInputs==nullptr) {
      // no specialized parameters: the inputs are the whole argument array
      (*compiled_fn)(inputs.unsafeArray(), outputs.unsafeArray());
    } else {
      // the argument array is [parameters | inputs]; refresh the inputs part
      std::copy(inputs.unsafeArray(),inputs.unsafeArray()+nInputs,parametersAndInputs+nParams);
      (*compiled_fn)(parametersAndInputs, outputs.unsafeArray());
    }
    return true;
  } else {
    // load the inputs into their value slots
    size_t i = 0;
    for (size_t r = 0; r < inputs.numRows(); r++)
      for (size_t c = 0; c < inputs.numColumns(); c++)
        ring().set(values[varsPos[i++]], inputs.entry(r, c));

    // run every node of the program in order
    nIt = slp->mNodes.begin();
    numInputsIt = slp->mNumInputs.begin();
    inputPositionsIt = slp->mInputPositions.begin();
    for (vIt = values.begin() + slp->inputCounter; vIt != values.end(); ++vIt)
      computeNextNode();

    // collect the outputs
    i = 0;
    for (size_t r = 0; r < outputs.numRows(); r++)
      for (size_t c = 0; c < outputs.numColumns(); c++)
        ring().set(outputs.entry(r, c), values[ap(slp->mOutputPositions[i++])]);
    return true;
  }
}


// Writes a one-line description of this evaluator to `o`: the input, output
// and parameter counts for a compiled evaluator, or the underlying program
// for an interpreted one, followed in both cases by the ring.
template <typename RT>
void SLEvaluatorConcrete<RT>::text_out(buffer& o) const
{
  if (not isCompiled)
    {
      o << "SLEvaluator(slp = ";
      slp->text_out(o);
      o << ", mRing = ";
      ring().text_out(o);
      o << ")" << newline;
      return;
    }

  o << "compiled SLEvaluator(";
  o << nInputs << " inputs, ";
  o << nOutputs << " outputs, ";
  o << nParams << " parameters, mRing = ";
  ring().text_out(o);
  o << ")" << newline;
}


// Creates a homotopy object from this evaluator together with `Hxt` and
// `HxH`, which must both be SLEvaluatorConcrete<RT> instances.
// Returns a newly allocated HomotopyConcrete, or nullptr (after recording an
// error with ERROR) if either argument has a different concrete type.
template <typename RT>
Homotopy* SLEvaluatorConcrete<RT>::createHomotopy(SLEvaluator* Hxt,
                                                  SLEvaluator* HxH)
{
  auto* castHxt = dynamic_cast<SLEvaluatorConcrete<RT>*>(Hxt);
  auto* castHxH = dynamic_cast<SLEvaluatorConcrete<RT>*>(HxH);

  if (castHxt != nullptr and castHxH != nullptr)
    {
      typedef HomotopyConcrete<RT, typename HomotopyAlgorithm<RT>::Algorithm>
          HomotopyType;
      return new HomotopyType(*this, *castHxt, *castHxH);
    }

  ERROR("expected SLEvaluators in the same ring");
  return nullptr;
}


// Computes the sum of the squared absolute values of the first n entries of
// the vector M and stores it in `result` (i.e. the squared 2-norm).
//
//   M      - a vector stored as a dense matrix; if M has exactly one column
//            its entries are read down that column, otherwise they are read
//            along row 0
//   n      - number of entries to accumulate
//   result - receives the sum; must be an initialized element of the real ring
template <typename RT>
inline void norm2(const DMat<RT>& M,
                  size_t n,
                  typename RT::RealElementType& result)
{
  const auto& C = M.ring();
  const auto& R = C.real_ring();
  typename RT::RealRingType::Element c(R);

  // Index according to the shape of M so that a column vector is never
  // addressed with an out-of-range column index.
  const bool isColumnVector = (M.numColumns() == 1);

  R.set_zero(result);
  for (size_t i = 0; i < n; i++)
    {
      C.abs_squared(c, isColumnVector ? M.entry(i, 0) : M.entry(0, i));
      R.add(result, result, c);
    }
}


// Status of a tracked solution path.
// The numeric values are written to the output_extras matrix by track(), so
// they are spelled out explicitly and must not be changed or reordered.
enum SolutionStatus {
  UNDETERMINED = 0,
  PROCESSING = 1,          // path is still being tracked
  REGULAR = 2,             // tracking finished without a failure status
  SINGULAR = 3,            // a linear solve failed
  INFINITY_FAILED = 4,     // squared norm exceeded the infinity threshold
  MIN_STEP_FAILED = 5,     // step became smaller than the minimal step
  ORIGIN_FAILED = 6,       // point is zero or too close to the origin
  INCREASE_PRECISION = 7,  // current precision is below what is needed
  DECREASE_PRECISION = 8   // current precision is more than twice the need
};


// Scope-bound holder for a single element of the ring RT.
// The constructor initializes the element with RT::init and the destructor
// releases it with RT::clear. The ring is held by reference and must outlive
// the holder.
template <typename RT>
class ARingElement
{
  typename RT::ElementType mValue;
  const RT& mRing;

 public:
  ARingElement(const RT& R0) : mRing(R0) { mRing.init(mValue); }
  ~ARingElement() { mRing.clear(mValue); }

  // The holder owns mValue: a member-wise copy would make two holders clear
  // the same element, so copying is disabled.
  ARingElement(const ARingElement&) = delete;
  ARingElement& operator=(const ARingElement&) = delete;

  // Access to the held element.
  typename RT::ElementType& get() { return mValue; }
  const typename RT::ElementType& get() const { return mValue; }

  // The ring the element belongs to.
  const RT& ring() const { return mRing; }

  // Forwards to the free function realPart applied to the held element.
  typename RT::RealElementType& getRealPart() { return realPart(mValue); }
};


// ****************************** XXX

// **************************************************

// Tracks solution paths of the homotopy with a Runge-Kutta-4 predictor and a

// Newton-style corrector, in the fixed precision of the ring RT.

//

//   inputs        - dense (n+1) x n_sols matrix; column s holds the starting

//                   point x_0..x_(n-1) followed by the initial value of the

//                   continuation parameter

//   outputs       - dense (n+2) x n_sols matrix; on entry row n of column s

//                   holds the target value of the continuation parameter; on

//                   exit rows 0..n hold the last accepted point and parameter

//                   value, and row n+1 the last parameter increment attempted

//   output_extras - dense 2 x n_sols integer matrix; row 0 receives the

//                   SolutionStatus of each path, row 1 the number of

//                   accepted steps

//   init_dt       - initial step length

//   min_dt        - minimal step length; a failed step shorter than this

//                   ends the path with MIN_STEP_FAILED

//   epsilon       - corrector tolerance (relative to the norm of the point)

//   max_corr_steps     - maximal number of corrector iterations per step

//   infinity_threshold - bound used by the infinity/origin checks

//   checkPrecision     - if true, estimate after each step whether the

//                        working precision should be increased or decreased

//

// Returns false (after recording an error with ERROR) if the matrices have

// the wrong type, ring or shape. Returns true otherwise, even when individual

// paths fail; the per-path outcome is reported through output_extras.

template <typename RT>


bool HomotopyConcrete<RT, FixedPrecisionHomotopyAlgorithm>::track(

    const MutableMatrix* inputs,

    MutableMatrix* outputs,

    MutableMatrix* output_extras,

    gmp_RR init_dt,

    gmp_RR min_dt,

    gmp_RR epsilon,  // o.CorrectorTolerance,

    int max_corr_steps,

    gmp_RR infinity_threshold,

    bool checkPrecision)

{

  std::chrono::steady_clock::time_point start =

      std::chrono::steady_clock::now();

  size_t solveLinearTime = 0, solveLinearCount = 0, evaluateTime = 0;


  // std::cout << "inside

  // HomotopyConcrete<RT,FixedPrecisionHomotopyAlgorithm>::track" << std::endl;

  // double the_smallest_number = 1e-13;

  const Ring* matRing = inputs->get_ring();

  if (outputs->get_ring() != matRing)

    {

      ERROR("outputs and inputs are in different rings");

      return false;

    }

  auto inp = dynamic_cast<const MutableMat<DMat<RT> >*>(inputs);

  auto out = dynamic_cast<MutableMat<DMat<RT> >*>(outputs);

  auto out_extras =

      dynamic_cast<MutableMat<DMat<M2::ARingZZGMP> >*>(output_extras);

  if (inp == nullptr)

    {

      ERROR("inputs: expected a dense mutable matrix");

      return false;

    }

  if (out == nullptr)

    {

      ERROR("outputs: expected a dense mutable matrix");

      return false;

    }

  if (out_extras == nullptr)

    {

      ERROR("output_extras: expected a dense mutable matrix");

      return false;

    }


  auto& in = inp->getMat();

  auto& ou = out->getMat();

  auto& oe = out_extras->getMat();

  size_t n_sols = in.numColumns();

  size_t n = in.numRows() - 1;  // number of x vars


  if (ou.numColumns() != n_sols or ou.numRows() != n + 2)

    {

      ERROR("output: wrong shape");

      return false;

    }

  if (oe.numColumns() != n_sols or oe.numRows() != 2)

    {

      ERROR("output_extras: wrong shape");

      return false;

    }


  const RT& C = in.ring();

  typename RT::RealRingType R = C.real_ring();


  typedef typename RT::ElementType ElementType;

  typedef typename RT::Element Element;

  typedef typename RT::RealRingType::Element RealElement;

  typedef typename RT::RealRingType::ElementType RealElementType;

  typedef MatElementaryOps<DMat<RT> > MatOps;


  // thresholds are stored squared, so that they can be compared with squared

  // norms directly

  RealElement t_step(R), min_step2(R), epsilon2(R), infinity_threshold2(R);

  R.set_from_BigReal(t_step, init_dt);  // initial step

  R.set_from_BigReal(min_step2, min_dt);

  R.mult(min_step2, min_step2, min_step2);  // min_step^2

  R.set_from_BigReal(epsilon2, epsilon);

  // log2 of the tolerance, taken before epsilon2 is squared; used by the

  // precision check below

  int tolerance_bits = int(log2(fabs(R.coerceToDouble(epsilon2))));

  R.mult(epsilon2, epsilon2, epsilon2);  // epsilon^2

  R.set_from_BigReal(infinity_threshold2, infinity_threshold);

  R.mult(infinity_threshold2, infinity_threshold2, infinity_threshold2);

  int num_successes_before_increase = 3;


  RealElement t0(R), dt(R), one_minus_t0(R), dx_norm2(R), x_norm2(R), abs2dc(R);


  // constants

  RealElement one(R), two(R), four(R), six(R), one_half(R), one_sixth(R);

  // the step is multiplied by dt_factor after a failure and divided by it

  // after num_successes_before_increase consecutive successes

  RealElementType& dt_factor = one_half;

  R.set_from_long(one, 1);

  R.set_from_long(two, 2);

  R.set_from_long(four, 4);

  R.set_from_long(six, 6);

  R.divide(one_half, one, two);

  R.divide(one_sixth, one, six);


  Element c_init(C), c_end(C), dc(C), one_half_dc(C);


  // think: x_0..x_(n-1), c

  // c = the homotopy continuation parameter "t" upstairs, varies on a

  // (straight line) segment of complex plane (from c_init to c_end)

  // t = a real running in the interval [0,1]


  DMat<RT> x0c0(C, n + 1, 1);

  DMat<RT> x1c1(C, n + 1, 1);

  DMat<RT> xc(C, n + 1, 1);

  DMat<RT> HxH(C, n, n + 1);

  DMat<RT>& Hxt = HxH;  // the matrix has the same shape: reuse memory

  DMat<RT> LHSmat(C, n, n);

  auto LHS = submatrix(LHSmat);

  DMat<RT> RHSmat(C, n, 1);

  auto RHS = submatrix(RHSmat);

  DMat<RT> dx(C, n, 1);

  DMat<RT> dx1(C, n, 1);

  DMat<RT> dx2(C, n, 1);

  DMat<RT> dx3(C, n, 1);

  DMat<RT> dx4(C, n, 1);

  DMat<RT> Jinv_times_random(C, n, 1);


  // the last entry of each point vector is its continuation parameter

  ElementType& c0 = x0c0.entry(n, 0);

  ElementType& c1 = x1c1.entry(n, 0);

  ElementType& c = xc.entry(n, 0);

  RealElementType& tol2 = epsilon2;  // current tolerance squared

  bool linearSolve_success;

  for (size_t s = 0; s < n_sols; s++)

    {

      SolutionStatus status = PROCESSING;

      // set initial solution and initial value of the continuation parameter

      // for(size_t i=0; i<=n; i++)

      //  C.set(x0c0.entry(i,0), in.entry(i,s));

      submatrix(x0c0) = submatrix(const_cast<DMat<RT>&>(in), 0, s, n + 1, 1);

      C.set(c_init, c0);

      // the target parameter value is read from the outputs matrix

      C.set(c_end, ou.entry(n, s));


      R.set_zero(t0);

      bool t0equals1 = false;


      // t_step is actually the initial (absolute) length of step on the

      // interval [c_init,c_end]

      // dt is an increment for t on the interval [0,1]

      R.set(dt, t_step);

      C.subtract(dc, c_end, c_init);

      C.abs(abs2dc, dc);  // don't want to create new temporary elts: reusing dc

                          // and abs2dc

      R.divide(dt, dt, abs2dc);


      int predictor_successes = 0;

      int count = 0;  // number of steps

      // track the real segment (1-t)*c0 + t*c1, t\in [0,1]

      while (status == PROCESSING and not t0equals1)

        {

          if (M2_numericalAlgebraicGeometryTrace > 3)

            {

              buffer o;

              R.elem_text_out(o, t0, true, false, false);

              std::cout << "t0 = " << o.str();

              o.reset();

              C.elem_text_out(o, c0, true, false, false);

              std::cout << ", c0 = " << o.str() << std::endl;

            }

          R.subtract(one_minus_t0, one, t0);

          // if the step would overshoot t = 1, shorten it to land exactly on

          // the end of the segment

          if (R.compare_elems(dt, one_minus_t0) > 0)

            {

              R.set(dt, one_minus_t0);

              t0equals1 = true;

              C.subtract(dc, c_end, c0);

              C.set(c1, c_end);

            }

          else

            {

              // dc = (c_end - c0) * dt / (1 - t0)

              C.subtract(dc, c_end, c0);

              C.mult(dc, dc, dt);

              C.divide(dc, dc, one_minus_t0);

              C.add(c1, c0, dc);

            }


          // PREDICTOR in: x0c0,dt

          //           out: dx

          /*  top-level code for Runge-Kutta-4

              dx1 := solveHxTimesDXequalsMinusHt(x0,t0);

              dx2 := solveHxTimesDXequalsMinusHt(x0+(1/2)*dx1*dt,t0+(1/2)*dt);

              dx3 := solveHxTimesDXequalsMinusHt(x0+(1/2)*dx2*dt,t0+(1/2)*dt);

              dx4 := solveHxTimesDXequalsMinusHt(x0+dx3*dt,t0+dt);

              (1/6)*dt*(dx1+2*dx2+2*dx3+dx4)

          */


          C.mult(one_half_dc, dc, one_half);


          // dx1

          submatrix(xc) = submatrix(x0c0);

          TIME(evaluateTime, mHxt.evaluate(xc, Hxt))


          // the first n columns of Hxt form the left-hand side, the last

          // column (negated) the right-hand side

          LHS = submatrix(Hxt, 0, 0, n, n);

          RHS = submatrix(Hxt, 0, n, n, 1);

          MatrixOps::negateInPlace(RHSmat);


          TIME(solveLinearTime,

               linearSolve_success =

                   MatrixOps::solveLinear(LHSmat, RHSmat, dx1));

          solveLinearCount++;


          // dx2

          if (linearSolve_success)

            {

              submatrix(dx1) *= one_half_dc;  // "dx1" := (1/2)*dx1*dt

              submatrix(xc, 0, 0, n, 1) += submatrix(dx1);

              C.add(c, c, one_half_dc);


              TIME(evaluateTime, mHxt.evaluate(xc, Hxt))


              LHS = submatrix(Hxt, 0, 0, n, n);

              RHS = submatrix(Hxt, 0, n, n, 1);

              MatrixOps::negateInPlace(RHSmat);


              TIME(solveLinearTime,

                   linearSolve_success =

                       MatrixOps::solveLinear(LHSmat, RHSmat, dx2);)

              solveLinearCount++;

            }


          // dx3

          if (linearSolve_success)

            {

              submatrix(dx2) *= one_half_dc;  // "dx2" := (1/2)*dx2*dt

              submatrix(xc, 0, 0, n, 1) = submatrix(x0c0, 0, 0, n, 1);

              submatrix(xc, 0, 0, n, 1) += submatrix(dx2);

              // C.add(c,c,one_half_dc); // c should not change here??? or copy

              // c two lines above???


              TIME(evaluateTime, mHxt.evaluate(xc, Hxt));


              LHS = submatrix(Hxt, 0, 0, n, n);

              RHS = submatrix(Hxt, 0, n, n, 1);

              MatrixOps::negateInPlace(RHSmat);


              TIME(solveLinearTime,

                   linearSolve_success =

                       MatrixOps::solveLinear(LHSmat, RHSmat, dx3););

              solveLinearCount++;

            }


          // dx4

          if (linearSolve_success)

            {

              submatrix(dx3) *= dc;  // "dx3" := dx3*dt

              submatrix(xc) = submatrix(

                  x0c0);  // sets c=c0 as well (not needed for dx2???,dx3)

              submatrix(xc, 0, 0, n, 1) += submatrix(dx3);

              C.add(c, c, dc);


              TIME(evaluateTime, mHxt.evaluate(xc, Hxt));


              LHS = submatrix(Hxt, 0, 0, n, n);

              RHS = submatrix(Hxt, 0, n, n, 1);

              MatrixOps::negateInPlace(RHSmat);


              TIME(solveLinearTime,

                   linearSolve_success =

                       MatrixOps::solveLinear(LHSmat, RHSmat, dx4););

              solveLinearCount++;

            }


          // "dx1" = .5*dx1*dt, "dx2" = .5*dx2*dt, "dx3" = dx3*dt

          if (linearSolve_success)

            {

              submatrix(dx4) *= dc;  // "dx4" = dx4*dt

              submatrix(dx) =

                  submatrix(dx4);  // dx = (1/6)*dt*(dx1+2*dx2+2*dx3+dx4)

                                   //    = (1/6)*(2*"dx1"+4*"dx2"+2*"dx3"+"dx4")

              submatrix(dx1) *= two;

              submatrix(dx) += dx1;

              // submatrix(dx).addMultipleTo(two,dx1);

              submatrix(dx2) *= four;

              submatrix(dx) += dx2;

              submatrix(dx3) *= two;

              submatrix(dx) += dx3;

              submatrix(dx) *= one_sixth;


              // predicted point: x1c1 = x0c0 + (dx, dc)

              submatrix(x1c1) = submatrix(x0c0);

              submatrix(x1c1, 0, 0, n, 1) += dx;

              C.add(c1, c0, dc);

            }


          // CORRECTOR

          // is_successful is only assigned inside the corrector loop; the

          // test after the loop reads it only when linearSolve_success is

          // true, i.e. only after at least one corrector iteration has run

          bool is_successful;

          int n_corr_steps = 0;

          if (linearSolve_success)

            {

              do

                {

                  n_corr_steps++;


                  TIME(evaluateTime, mHxH.evaluate(x1c1, HxH));


                  LHS = submatrix(HxH, 0, 0, n, n);

                  RHS = submatrix(HxH, 0, n, n, 1);

                  MatrixOps::negateInPlace(RHSmat);


                  TIME(solveLinearTime,

                       linearSolve_success =

                           MatrixOps::solveLinear(LHSmat, RHSmat, dx););

                  solveLinearCount++;


                  // x1 += dx

                  submatrix(x1c1, 0, 0, n, 1) += dx;


                  normSquared(submatrix(dx), dx_norm2);

                  normSquared(submatrix(x1c1, 0, 0, n, 1), x_norm2);


                  // converged when ||dx||^2 < tol^2 * ||x1||^2

                  R.mult(x_norm2, x_norm2, tol2);

                  is_successful = R.compare_elems(dx_norm2, x_norm2) < 0;

                }

              while (not is_successful and n_corr_steps < max_corr_steps);

            }

          // std::cout << "past corrector loop...\n";

          if (not linearSolve_success or not is_successful)

            {

              // predictor failure

              predictor_successes = 0;

              R.mult(dt, dt, dt_factor);

              t0equals1 = false;

              C.abs_squared(abs2dc, dc);

              if (R.compare_elems(abs2dc, min_step2) < 0)

                status = MIN_STEP_FAILED;

            }

          else

            {

              // predictor success

              predictor_successes = predictor_successes + 1;

              // accept the step; presumably this copies x1c1 into x0c0

              // (NOTE(review): confirm against MatElementaryOps)

              MatOps::setFromSubmatrix(x1c1, 0, n, 0, 0, x0c0);

              R.add(t0, t0, dt);  // increment t: so far only s was incremented

              count++;

              if (predictor_successes >= num_successes_before_increase)

                {

                  predictor_successes = 0;

                  R.divide(dt, dt, dt_factor);

                }

            }


          normSquared(submatrix(x0c0, 0, 0, n, 1),

                      x_norm2);  // x_norm2 = ||x0||^2


          if (not linearSolve_success)

            status = SINGULAR;

          else if (checkPrecision and not t0equals1)

            {  // precision check

              mHxH.evaluate(x0c0, HxH);

              MatOps::setFromSubmatrix(HxH, 0, n - 1, 0, n - 1, LHSmat);  // Hx

              // setRandomUnitVector(RHSmat,n);

              for (int i = 0; i < n; i++) C.random(RHSmat.entry(i, 0));


              TIME(solveLinearTime,

                   linearSolve_success = MatrixOps::solveLinear(

                       LHSmat, RHSmat, Jinv_times_random););

              solveLinearCount++;


              norm2(Jinv_times_random,

                    n,

                    dx_norm2);  // this stands for ||J^{-1}||

//   ||J^{-1}|| should be multiplied by a factor

//   reflecting an estimate on the error of evaluation of J

#define PRECISION_SAFETY_BITS 10

              // dx_norm2 holds a squared quantity, hence the division by 2

              int more_bits = int(log2(fabs(R.coerceToDouble(dx_norm2)))) / 2;

              int precision_needed = PRECISION_SAFETY_BITS + tolerance_bits + more_bits;

              if (precision_needed<53) precision_needed = 53;

              if (M2_numericalAlgebraicGeometryTrace > 3)

                std::cout << "precision needed = " << precision_needed << " = "

                          << PRECISION_SAFETY_BITS << "(safety) + "

                          << tolerance_bits << "(tolerance) + "

                          << more_bits << "(additional)\n"

                          << "current precision = " << R.get_precision() << std::endl;

              if (R.get_precision() < precision_needed)

                 status = INCREASE_PRECISION;

              else if (R.get_precision() != 53 and

                       R.get_precision() > 2 * precision_needed)

                status = DECREASE_PRECISION;

              if (M2_numericalAlgebraicGeometryTrace > 3)

                std::cout << "status = " << status << std::endl;

            };


          // infinity/origin checks

          if (status == PROCESSING)

            {

              if (R.compare_elems(infinity_threshold2, x_norm2) < 0)

                status = INFINITY_FAILED;

              else

                {

                  if (R.is_zero(x_norm2))

                    status = ORIGIN_FAILED;

                  else

                    {

                      R.divide(x_norm2, one, x_norm2);  // 1/||x||^2

                      if (R.compare_elems(infinity_threshold2, x_norm2) < 0)

                        status = ORIGIN_FAILED;

                    }

                }

            }

        }

      // record the solution

      // copy the last accepted point and parameter value into column s

      for (size_t i = 0; i <= n; i++) C.set(ou.entry(i, s), x0c0.entry(i, 0));

      C.set(ou.entry(n + 1, s), dc);  // store last increment attempted

      if (status == PROCESSING) status = REGULAR;

      oe.ring().set_from_long(oe.entry(0, s), status);

      oe.ring().set_from_long(oe.entry(1, s), count);

    }


  std::chrono::steady_clock::time_point end = std::chrono::steady_clock::now();

  if (M2_numericalAlgebraicGeometryTrace > 1)

    {

      std::cout << "-- track took "

                << std::chrono::duration_cast<std::chrono::milliseconds>(end -

                                                                         start)

                       .count()

                << "ms.\n";

      std::cout << "-- # of solveLinear calls = " << solveLinearCount

                << std::endl;

      std::cout << "-- time of solveLinear calls = " << solveLinearTime

                << " ns." << std::endl;

      std::cout << "-- time of evaluate calls = " << evaluateTime << " ns."

                << std::endl;

    }

  return true;

}


// Fallback for ring/algorithm combinations without a tracker.
// Ignores every argument, records an error with ERROR and returns false.
template <typename RT, typename Algorithm>
bool HomotopyConcrete<RT, Algorithm>::track(
    const MutableMatrix* inputs,
    MutableMatrix* outputs,
    MutableMatrix* output_extras,
    gmp_RR init_dt,
    gmp_RR min_dt,
    gmp_RR epsilon,  // o.CorrectorTolerance,
    int max_corr_steps,
    gmp_RR infinity_threshold,
    bool checkPrecision)
{
  // Nothing is used; silence unused-parameter warnings.
  static_cast<void>(inputs);
  static_cast<void>(outputs);
  static_cast<void>(output_extras);
  static_cast<void>(init_dt);
  static_cast<void>(min_dt);
  static_cast<void>(epsilon);
  static_cast<void>(max_corr_steps);
  static_cast<void>(infinity_threshold);
  static_cast<void>(checkPrecision);

  ERROR("track: not implemented for this type of ring");
  return false;
}


// Description of the fallback homotopy: a fixed line stating that tracking
// is not implemented for this combination of ring and algorithm.
template <typename RT, typename Algorithm>
void HomotopyConcrete<RT, Algorithm>::text_out(buffer& o) const
{
  o << "HomotopyConcrete<...,...> : track not implemented";
  o << newline;
}


// Binds the three evaluators used by the fixed-precision tracker.
// The evaluators are held by reference, so they must outlive this object.
template <typename RT>
HomotopyConcrete<RT, FixedPrecisionHomotopyAlgorithm>::HomotopyConcrete(
    EType& Hx,
    EType& Hxt,
    EType& HxH)
    : mHx(Hx),
      mHxt(Hxt),
      mHxH(HxH)
{
}


// Writes a description of the fixed-precision homotopy to `o`, including the
// descriptions of its three evaluators Hx, Hxt and HxH.
template <typename RT>
void HomotopyConcrete<RT, FixedPrecisionHomotopyAlgorithm>::text_out(
    buffer& o) const
{
  o << "HomotopyConcrete<...,fixed precision>(Hx = ";
  mHx.text_out(o);

  o << ", Hxt = ";
  mHxt.text_out(o);

  o << ", HxH = ";
  mHxH.text_out(o);

  o << ")";
  o << newline;
}


#endif


// Local Variables:

// compile-command: "make -C $M2BUILDDIR/Macaulay2/e "

// indent-tabs-mode: nil

// End:

dlsym
#define dlsym(x, y)
Definition NAG.cpp:15

dlopen
#define dlopen(x, y)
Definition NAG.cpp:14

PRECISION_SAFETY_BITS
#define PRECISION_SAFETY_BITS

SolutionStatus
SolutionStatus
Definition SLP-imp.hpp:353

PROCESSING
@ PROCESSING
Definition SLP-imp.hpp:355

INFINITY_FAILED
@ INFINITY_FAILED
Definition SLP-imp.hpp:358

ORIGIN_FAILED
@ ORIGIN_FAILED
Definition SLP-imp.hpp:360

INCREASE_PRECISION
@ INCREASE_PRECISION
Definition SLP-imp.hpp:361

DECREASE_PRECISION
@ DECREASE_PRECISION
Definition SLP-imp.hpp:362

MIN_STEP_FAILED
@ MIN_STEP_FAILED
Definition SLP-imp.hpp:359

UNDETERMINED
@ UNDETERMINED
Definition SLP-imp.hpp:354

SINGULAR
@ SINGULAR
Definition SLP-imp.hpp:357

REGULAR
@ REGULAR
Definition SLP-imp.hpp:356

norm2
void norm2(const DMat< RT > &M, size_t n, typename RT::RealElementType &result)
Definition SLP-imp.hpp:338

ARingElement::ring
const RT & ring() const
Definition SLP-imp.hpp:376

ARingElement::get
RT::ElementType & get()
Definition SLP-imp.hpp:374

ARingElement::ARingElement
ARingElement(const RT &R0)
Definition SLP-imp.hpp:372

ARingElement::get
const RT::ElementType & get() const
Definition SLP-imp.hpp:375

ARingElement::~ARingElement
~ARingElement()
Definition SLP-imp.hpp:373

ARingElement::mValue
RT::ElementType mValue
Definition SLP-imp.hpp:368

ARingElement::mRing
const RT & mRing
Definition SLP-imp.hpp:369

ARingElement::getRealPart
RT::RealElementType & getRealPart()
Definition SLP-imp.hpp:377

DMat::numRows
size_t numRows() const
Definition dmat.hpp:144

DMat::entry
ElementType & entry(size_t row, size_t column)
Definition dmat.hpp:148

DMat::ring
const ACoeffRing & ring() const
Definition dmat.hpp:143

DMat::unsafeArray
const ElementType * unsafeArray() const
Definition dmat.hpp:170

DMat::numColumns
size_t numColumns() const
Definition dmat.hpp:145

DMat
Definition dmat.hpp:62

DMatLinAlg::determinant
void determinant(ElementType &result)
Output: result, the determinant of A.
Definition dmat-lu.hpp:308

DMatLinAlg
Definition dmat-lu.hpp:58

HomotopyConcrete< RT, FixedPrecisionHomotopyAlgorithm >::mHxt
EType & mHxt
Definition SLP-defs.hpp:435

HomotopyConcrete< RT, FixedPrecisionHomotopyAlgorithm >::mHx
EType & mHx
Definition SLP-defs.hpp:435

HomotopyConcrete< RT, FixedPrecisionHomotopyAlgorithm >::mHxH
EType & mHxH
Definition SLP-defs.hpp:435

HomotopyConcrete::text_out
void text_out(buffer &o) const
Definition SLP-imp.hpp:833

HomotopyConcrete::HomotopyConcrete
HomotopyConcrete(EType &Hx, EType &Hxt, EType &HxH)
Definition SLP-defs.hpp:382

HomotopyConcrete::track
bool track(const MutableMatrix *inputs, MutableMatrix *outputs, MutableMatrix *output_extras, gmp_RR init_dt, gmp_RR min_dt, gmp_RR epsilon, int max_corr_steps, gmp_RR infinity_threshold, bool checkPrecision)
Definition SLP-imp.hpp:808

HomotopyConcrete::EType
SLEvaluatorConcrete< RT > EType
Definition SLP-defs.hpp:380

HomotopyConcrete
Definition SLP-defs.hpp:378

Homotopy
Abstract base for the predictor-corrector path-tracker hierarchy.
Definition SLP-defs.hpp:361

M2_arrayint

MatElementaryOps
Definition mat-arith.hpp:41

MutableMat::getMat
Mat & getMat()
Definition mutablemat-defs.hpp:283

MutableMat
Definition mutablemat-defs.hpp:241

MutableMatrix::get_ring
virtual const Ring * get_ring() const =0

MutableMatrix
Abstract base class for mutable matrices over an arbitrary engine Ring, the in-place counterpart of t...
Definition mat.hpp:79

Ring
Engine ring type (no brief description is provided in the source header).
Definition ring.hpp:102

SLEvaluator::nIt
std::vector< SLProgram::GATE_TYPE >::iterator nIt
Definition SLP-defs.hpp:284

SLEvaluator::numInputsIt
std::vector< SLProgram::GATE_SIZE >::iterator numInputsIt
Definition SLP-defs.hpp:285

SLEvaluator::ap
int ap(int rp)
Definition SLP-defs.hpp:280

SLEvaluator::inputPositionsIt
std::vector< SLProgram::GATE_POSITION >::iterator inputPositionsIt
Definition SLP-defs.hpp:286

SLEvaluator::varsPos
std::vector< SLProgram::GATE_POSITION > varsPos
TODO: can this be made a reference instead of a copy?
Definition SLP-defs.hpp:283

SLEvaluator::slp
SLProgram * slp
Definition SLP-defs.hpp:282

SLEvaluatorConcrete::createHomotopy
Homotopy * createHomotopy(SLEvaluator *Hxt, SLEvaluator *HxH)
Definition SLP-imp.hpp:323

SLEvaluatorConcrete::ring
const RT & ring() const
Definition SLP-defs.hpp:319

SLEvaluatorConcrete::isCompiled
bool isCompiled
Definition SLP-defs.hpp:333

SLEvaluatorConcrete::evaluate
bool evaluate(const MutableMatrix *inputs, MutableMatrix *outputs)
Definition SLP-imp.hpp:227

SLEvaluatorConcrete::values
std::vector< ElementType > values
Definition SLP-defs.hpp:337

SLEvaluatorConcrete::~SLEvaluatorConcrete
~SLEvaluatorConcrete()
Definition SLP-imp.hpp:119

SLEvaluatorConcrete::computeNextNode
void computeNextNode()
Definition SLP-imp.hpp:189

SLEvaluatorConcrete::specialize
SLEvaluator * specialize(const MutableMatrix *parameters) const
Definition SLP-imp.hpp:151

SLEvaluatorConcrete::vIt
std::vector< ElementType >::iterator vIt
Definition SLP-defs.hpp:329

SLEvaluatorConcrete::nOutputs
int nOutputs
Definition SLP-defs.hpp:334

SLEvaluatorConcrete::compiled_fn
void(* compiled_fn)(ElementType const *, ElementType *)
Definition SLP-defs.hpp:342

SLEvaluatorConcrete::nParams
int nParams
Definition SLP-defs.hpp:343

SLEvaluatorConcrete::parametersAndInputs
ElementType * parametersAndInputs
Definition SLP-defs.hpp:344

SLEvaluatorConcrete::mRing
const RT & mRing
Definition SLP-defs.hpp:332

SLEvaluatorConcrete::nInputs
int nInputs
Definition SLP-defs.hpp:334

SLEvaluatorConcrete::SLEvaluatorConcrete
SLEvaluatorConcrete(const SLEvaluatorConcrete< RT > &)
Definition SLP-imp.hpp:103

SLEvaluatorConcrete::text_out
void text_out(buffer &o) const
Definition SLP-imp.hpp:304

SLEvaluatorConcrete::ElementType
typename RT::ElementType ElementType
Definition SLP-defs.hpp:328

SLEvaluator
Abstract base for the SLP evaluator hierarchy.
Definition SLP-defs.hpp:270

SLP
Definition NAG.hpp:485

SLProgram::Det
@ Det
Definition SLP-defs.hpp:91

SLProgram::Divide
@ Divide
Definition SLP-defs.hpp:91

SLProgram::MSum
@ MSum
Definition SLP-defs.hpp:91

SLProgram::MProduct
@ MProduct
Definition SLP-defs.hpp:91

SLProgram
A straight-line program: a directed acyclic graph of arithmetic gates over a fixed list of inputs and...
Definition SLP-defs.hpp:89

SMat
Definition smat.hpp:43

buffer::str
char * str()
Definition buffer.hpp:72

buffer::reset
void reset()
Definition buffer.hpp:69

buffer
Definition buffer.hpp:55

int

p
int p
Definition godboltTest.cpp:36

s
void size_t s
Definition m2-mem.cpp:271

ERROR
const int ERROR
Definition m2-mem.cpp:55

result
VALGRIND_MAKE_MEM_DEFINED & result(result)

M2_numericalAlgebraicGeometryTrace
int M2_numericalAlgebraicGeometryTrace
Definition m2-types.cpp:53

newline
char newline[]
Definition m2-types.cpp:49

gmp_RR
mpfr_srcptr gmp_RR
Definition m2-types.h:148

normSquared
void normSquared(SubMatrix< MatType > M, typename MatType::CoeffRing::RealElementType &result)
Definition mat-arith.hpp:185

submatrix
SubMatrix< MatType > submatrix(MatType &m)
Definition mat-arith.hpp:201

MatrixOps::negateInPlace
void negateInPlace(DMat< RT > &A)
Definition mat-arith.hpp:243

MatrixOps::solveLinear
bool solveLinear(const Mat &A, const Mat &B, Mat &X)
solve AX=B, return true if the system has a solution.
Definition mat-linalg.hpp:230

end
TermIterator< Nterm > end(Nterm *)
Definition ringelem.cpp:5

exc::engine_error
Definition exceptions.hpp:42

TIME
#define TIME(t, call)
Definition timing.hpp:67

timing.hpp
Inline std::chrono::steady_clock wrappers and elapsed-time conversion helpers.

string_M2_to_std
std::string string_M2_to_std(const M2_string s)
Definition util.hpp:47