89 Real zerotol = std::sqrt(ROL_EPSILON<Real>());
91 ROL::Ptr<Vector<Real> > n = xvec_->clone();
92 ROL::Ptr<Vector<Real> > c = cvec_->clone();
93 ROL::Ptr<Vector<Real> > t = xvec_->clone();
94 ROL::Ptr<Vector<Real> > tCP = xvec_->clone();
95 ROL::Ptr<Vector<Real> > g = gvec_->clone();
96 ROL::Ptr<Vector<Real> > gf = gvec_->clone();
97 ROL::Ptr<Vector<Real> > Wg = xvec_->clone();
98 ROL::Ptr<Vector<Real> > ajl = gvec_->clone();
101 ROL::Ptr<Vector<Real> > l_new = lvec_->clone();
102 ROL::Ptr<Vector<Real> > c_new = cvec_->clone();
103 ROL::Ptr<Vector<Real> > g_new = gvec_->clone();
104 ROL::Ptr<Vector<Real> > gf_new = gvec_->clone();
107 f = obj.
value(x, zerotol);
112 con.
value(*c, x, zerotol);
115 computeQuasinormalStep(*n, *c, x, zeta_*Delta_, con, os);
124 solveTangentialSubproblem(*t, *tCP, *Wg, x, *g, *n, l, Delta_, obj, con, os);
125 totalIterCG_ += iterCG_;
128 accept(s, *n, *t, f_new, *c_new, *gf_new, *l_new, *g_new, x, l, f, *gf, *c, *g, *tCP, *Wg, obj, con, os);
192 os <<
"\n Quasi-normal step\n";
198 Real zerotol = std::sqrt(ROL_EPSILON<Real>());
199 std::vector<Real> augiters;
202 Ptr<Vector<Real> > nCP = xvec_->clone();
203 Ptr<Vector<Real> > nCPdual = gvec_->clone();
204 Ptr<Vector<Real> > nN = xvec_->clone();
205 Ptr<Vector<Real> > ctemp = cvec_->clone();
206 Ptr<Vector<Real> > dualc0 = lvec_->clone();
207 dualc0->set(c.
dual());
209 nCP->set(nCPdual->dual());
212 Real normsquare_ctemp = ctemp->dot(*ctemp);
213 if (normsquare_ctemp !=
zero) {
214 nCP->scale( -(nCP->dot(*nCP))/normsquare_ctemp );
219 Real norm_nCP = nCP->norm();
220 if (norm_nCP >= delta) {
222 n.
scale( delta/norm_nCP );
225 os <<
" taking partial Cauchy step\n";
236 Real tol = setTolOSS(qntol_*ctemp->norm());
239 nCPdual->set(nCP->dual());
240 nCPdual->scale(-one);
242 Ptr<Vector<Real> > dn = xvec_->clone();
243 Ptr<Vector<Real> > y = lvec_->clone();
247 totalIterLS_ = totalIterLS_ + augiters.size();
248 printInfoLS(augiters, os);
255 Real norm_nN = nN->norm();
256 if (norm_nN <= delta) {
261 os <<
" taking full Newton step\n";
269 Real aa = dn->dot(*dn);
270 Real bb = dn->dot(*nCP);
271 Real cc = norm_nCP*norm_nCP - delta*delta;
272 Real tau = (-bb+sqrt(bb*bb-aa*cc))/aa;
277 os <<
" taking dogleg step\n";
299 bool orthocheck =
true;
301 Real tol_ortho = 0.5;
308 Real zerotol = std::sqrt(ROL_EPSILON<Real>());
309 std::vector<Real> augiters;
314 Ptr<Vector<Real> > r = gvec_->clone();
315 Ptr<Vector<Real> > pdesc = xvec_->clone();
316 Ptr<Vector<Real> > tprev = xvec_->clone();
317 Ptr<Vector<Real> > Wr = xvec_->clone();
318 Ptr<Vector<Real> > Hp = gvec_->clone();
319 Ptr<Vector<Real> > xtemp = xvec_->clone();
320 Ptr<Vector<Real> > gtemp = gvec_->clone();
321 Ptr<Vector<Real> > ltemp = lvec_->clone();
322 Ptr<Vector<Real> > czero = cvec_->clone();
325 obj.
hessVec(*gtemp, n, x, zerotol);
331 Real normg = r->norm();
339 std::vector<Real> normWr(maxiterCG_+1,
zero);
341 std::vector<Ptr<Vector<Real > > > p;
342 std::vector<Ptr<Vector<Real > > > Hps;
343 std::vector<Ptr<Vector<Real > > > rs;
344 std::vector<Ptr<Vector<Real > > > Wrs;
349 std::ios_base::fmtflags osFlags(os.flags());
350 os <<
"\n Tangential subproblem\n";
351 os << std::setw(6) << std::right <<
"iter" << std::setw(18) <<
"||Wr||/||Wr0||" << std::setw(15) <<
"||s||";
352 os << std::setw(15) <<
"delta" << std::setw(15) <<
"||c'(x)s||" <<
"\n";
359 os <<
" >>> Tangential subproblem: Initial gradient is zero! \n";
362 iterCG_ = 0; Wg.
zero(); flagCG_ = 0;
367 while (iterCG_ < maxiterCG_) {
377 Real tol = setTolOSS(pgtol_);
380 totalIterLS_ = totalIterLS_ + augiters.size();
381 printInfoLS(augiters, os);
386 Wrs.push_back(xvec_->clone());
387 (Wrs[iterCG_-1])->set(*Wr);
390 if (normWg ==
zero) {
395 os <<
" Initial projected residual is close to zero! \n";
404 rs.push_back(xvec_->clone());
406 (rs[0])->set(r->dual());
411 Real tol = setTolOSS(projtol_);
414 totalIterLS_ = totalIterLS_ + augiters.size();
415 printInfoLS(augiters, os);
418 Wrs.push_back(xvec_->clone());
419 (Wrs[iterCG_-1])->set(*Wr);
423 normWr[iterCG_-1] = Wr->norm();
426 Ptr<Vector<Real> > ct = cvec_->clone();
428 Real linc = ct->norm();
429 std::ios_base::fmtflags osFlags(os.flags());
430 os << std::scientific << std::setprecision(6);
431 os << std::setw(6) << std::right << iterCG_-1 << std::setw(18) << normWr[iterCG_-1]/normWg << std::setw(15) << t.
norm();
432 os << std::setw(15) << delta << std::setw(15) << linc <<
"\n";
437 if (normWr[iterCG_-1]/normWg < tolCG_) {
442 os <<
" || W(g + H*(n+s)) || <= cgtol*|| W(g + H*n)|| \n";
450 LA::Matrix<Real> Wrr(iterCG_,iterCG_);
451 LA::Matrix<Real> T(iterCG_,iterCG_);
452 LA::Matrix<Real> Tm1(iterCG_,iterCG_);
453 for (
int i=0; i<iterCG_; i++) {
454 for (
int j=0; j<iterCG_; j++) {
455 Wrr(i,j) = (Wrs[i])->dot(*rs[j]);
456 T(i,j) = Wrr(i,j)/(normWr[i]*normWr[j]);
459 Tm1(i,j) = Tm1(i,j) - one;
463 if (Tm1.normOne() >= tol_ortho) {
464 LAPACK<int,Real> lapack;
465 std::vector<int> ipiv(iterCG_);
467 std::vector<Real> work(3*iterCG_);
469 lapack.GETRF(iterCG_, iterCG_, T.values(), T.stride(), &ipiv[0], &info);
470 lapack.GETRI(iterCG_, T.values(), T.stride(), &ipiv[0], &work[0], 3*iterCG_, &info);
472 for (
int i=0; i<iterCG_; i++) {
473 Tm1(i,i) = Tm1(i,i) - one;
475 if (Tm1.normOne() > S_max) {
479 os <<
" large nonorthogonality in W(R)'*R detected \n";
488 p.push_back(xvec_->clone());
489 (p[iterCG_-1])->set(*Wr);
490 (p[iterCG_-1])->scale(-one);
491 for (
int j=1; j<iterCG_; j++) {
492 Real scal = (p[iterCG_-1])->dot(*(Hps[j-1])) / (p[j-1])->dot(*(Hps[j-1]));
493 Ptr<Vector<Real> > pj = xvec_->clone();
496 (p[iterCG_-1])->plus(*pj);
500 Hps.push_back(xvec_->clone());
502 obj.
hessVec(*Hp, *(p[iterCG_-1]), x, zerotol);
509 (Hps[iterCG_-1])->set(Hp->dual());
511 pHp = (p[iterCG_-1])->dot(*(Hps[iterCG_-1]));
513 rp = (p[iterCG_-1])->dot(*(rs[iterCG_-1]));
515 normp = (p[iterCG_-1])->norm();
520 pdesc->set(*(p[iterCG_-1]));
521 if ((std::abs(rp) >= rptol*normp*normr) && (sgn(rp) == 1)) {
525 Real a = pdesc->dot(*pdesc);
526 Real b = pdesc->dot(t);
527 Real c = t.
dot(t) - delta*delta;
529 Real theta = (-b + std::sqrt(b*b - a*c)) / a;
530 xtemp->set(*(p[iterCG_-1]));
539 os <<
" negative curvature detected \n";
546 if (std::abs(rp) < rptol*normp*normr) {
550 os <<
" Zero alpha due to inexactness. \n";
560 xtemp->set(*(p[iterCG_-1]));
566 if (normt >= delta) {
567 pdesc->set(*(p[iterCG_-1]));
571 Real a = pdesc->dot(*pdesc);
572 Real b = pdesc->dot(*tprev);
573 Real c = tprev->dot(*tprev) - delta*delta;
575 Real theta = (-b + std::sqrt(b*b - a*c)) / a;
576 xtemp->set(*(p[iterCG_-1]));
587 os <<
" trust-region condition active \n";
594 xtemp->set(*(Hps[iterCG_-1]));
597 r->plus(xtemp->dual());
600 rs.push_back(xvec_->clone());
602 (rs[iterCG_])->set(r->dual());
612 os <<
" maximum number of iterations reached \n";
627 Real tol_red_tang = 1e-3;
628 Real tol_red_all = 1e-1;
631 Real tol_fdiff = 1e-12;
636 Real rpred_over_pred = 0.5*(1-eta_);
640 os <<
"\n Composite step acceptance\n";
648 Real zerotol = std::sqrt(ROL_EPSILON<Real>());
649 std::vector<Real> augiters;
654 Real part_pred =
zero;
655 Real linc_preproj =
zero;
656 Real linc_postproj =
zero;
657 Real tangtol_start =
zero;
658 Real tangtol = tangtol_;
662 bool try_tCP =
false;
665 Ptr<Vector<Real> > xtrial = xvec_->clone();
666 Ptr<Vector<Real> > Jl = gvec_->clone();
667 Ptr<Vector<Real> > gfJl = gvec_->clone();
668 Ptr<Vector<Real> > Jnc = cvec_->clone();
669 Ptr<Vector<Real> > t_orig = xvec_->clone();
670 Ptr<Vector<Real> > t_dual = gvec_->clone();
671 Ptr<Vector<Real> > Jt_orig = cvec_->clone();
672 Ptr<Vector<Real> > t_m_tCP = xvec_->clone();
673 Ptr<Vector<Real> > ltemp = lvec_->clone();
674 Ptr<Vector<Real> > xtemp = xvec_->clone();
675 Ptr<Vector<Real> > rt = cvec_->clone();
676 Ptr<Vector<Real> > Hn = gvec_->clone();
677 Ptr<Vector<Real> > Hto = gvec_->clone();
678 Ptr<Vector<Real> > cxxvec = gvec_->clone();
679 Ptr<Vector<Real> > czero = cvec_->clone();
681 Real Jnc_normsquared =
zero;
682 Real c_normsquared =
zero;
689 Jnc_normsquared = Jnc->dot(*Jnc);
690 c_normsquared = c.
dot(c);
692 for (
int ct=0; ct<ct_max; ct++) {
696 t_m_tCP->scale(-one);
698 if (t_m_tCP->norm() ==
zero) {
704 linc_preproj = Jt_orig->norm();
706 rpred = two*rpred_over_pred*pred;
709 tangtol_start = tangtol;
711 while (std::abs(rpred)/pred > rpred_over_pred) {
714 tangtol = tol_red_tang*tangtol;
716 if (tangtol < mintol) {
719 os <<
"\n The projection of the tangential step cannot be done with sufficient precision.\n";
720 os <<
" Is the quasi-normal step very small? Continuing with no global convergence guarantees.\n";
727 Real tol = setTolOSS(tangtol);
729 t_dual->set(t_orig->dual());
732 totalIterLS_ = totalIterLS_ + augiters.size();
733 printInfoLS(augiters, os);
736 linc_postproj = rt->norm();
743 obj.
hessVec(*Hn, n, x, zerotol);
748 obj.
hessVec(*Hto, *t_orig, x, zerotol);
759 f_new = obj.
value(*xtrial, zerotol);
760 obj.
gradient(gf_new, *xtrial, zerotol);
761 con.
value(c_new, *xtrial, zerotol);
763 computeLagrangeMultiplier(l_new, *xtrial, gf_new, con, os);
766 part_pred = - Wg.
dot(*t_orig);
771 part_pred -= n.
apply(*gfJl);
774 part_pred -= half*n.
apply(*Hn);
777 part_pred -= half*t_orig->apply(*Hto);
779 ltemp->axpy(-one, l);
782 part_pred -= Jnc->apply(*ltemp);
784 if ( part_pred < -half*penalty_*(c_normsquared-Jnc_normsquared) ) {
785 penalty_ = ( -two * part_pred / (c_normsquared-Jnc_normsquared) ) + beta;
788 pred = part_pred + penalty_*(c_normsquared-Jnc_normsquared);
793 rpred = - rt->apply(*ltemp) - penalty_ * rt->dot(*rt) - two * penalty_ * rt->dot(*Jnc);
801 tangtol = tangtol_start;
807 if ( t_orig->norm()/xtemp->norm() < tntmax_ ) {
811 t_m_tCP->set(*t_orig);
812 t_m_tCP->scale(-one);
814 if ((t_m_tCP->norm() > 0) && try_tCP) {
817 os <<
" ---> now trying tangential Cauchy point\n";
825 os <<
" ---> recomputing quasi-normal step and re-solving tangential subproblem\n";
845 lmhtol_ *= tol_red_all;
846 qntol_ *= tol_red_all;
847 pgtol_ *= tol_red_all;
848 projtol_ *= tol_red_all;
849 tangtol_ *= tol_red_all;
852 computeQuasinormalStep(n, c, x, zeta_*Delta_, con, os);
854 solveTangentialSubproblem(t, tCP, Wg, x, g, n, l, Delta_, obj, con, os);
855 totalIterCG_ += iterCG_;
870 if (std::abs(fdiff / (f+em24)) < tol_fdiff) {
876 ared = fdiff + (c.
apply(l) - c_new.
apply(l_new)) + penalty_*(c.
dot(c) - c_new.
dot(c_new));
889 std::ios_base::fmtflags osFlags(os.flags());
890 os << std::scientific << std::setprecision(6);
891 os <<
"\n Trial step info ...\n";
892 os <<
" n_norm = " << nnorm_ <<
"\n";
893 os <<
" t_norm = " << tnorm_ <<
"\n";
894 os <<
" s_norm = " << snorm_ <<
"\n";
895 os <<
" xtrial_norm = " << xtrial->norm() <<
"\n";
896 os <<
" f_old = " << f <<
"\n";
897 os <<
" f_trial = " << f_new <<
"\n";
898 os <<
" f_old-f_trial = " << f-f_new <<
"\n";
899 os <<
" ||c_old|| = " << c.
norm() <<
"\n";
900 os <<
" ||c_trial|| = " << c_new.
norm() <<
"\n";
901 os <<
" ||Jac*t_preproj|| = " << linc_preproj <<
"\n";
902 os <<
" ||Jac*t_postproj|| = " << linc_postproj <<
"\n";
903 os <<
" ||t_tilde||/||t|| = " << t_orig->norm() / t.
norm() <<
"\n";
904 os <<
" ||t_tilde||/||n+t|| = " << t_orig->norm() / snorm_ <<
"\n";
905 os <<
" # projections = " << num_proj <<
"\n";
906 os <<
" penalty param = " << penalty_ <<
"\n";
907 os <<
" ared = " << ared_ <<
"\n";
908 os <<
" pred = " << pred_ <<
"\n";
909 os <<
" ared/pred = " << ared_/pred_ <<
"\n";
1111 std::ios_base::fmtflags osFlags(os.flags());
1112 os << std::scientific << std::setprecision(6);
1113 if (state_->iter == 0) writeName(os);
1114 if (print_header) writeHeader(os);
1115 if (state_->iter == 0 ) {
1117 os << std::setw(6) << std::left << state_->iter;
1118 os << std::setw(15) << std::left << state_->value;
1119 os << std::setw(15) << std::left << state_->cnorm;
1120 os << std::setw(15) << std::left << state_->gnorm;
1121 os << std::setw(15) << std::left <<
"---";
1122 os << std::setw(10) << std::left <<
"---";
1123 os << std::setw(10) << std::left <<
"---";
1124 os << std::setw(10) << std::left <<
"---";
1125 os << std::setw(8) << std::left <<
"---";
1126 os << std::setw(8) << std::left <<
"---";
1127 os << std::setw(8) << std::left <<
"---";
1128 os << std::setw(8) << std::left <<
"---";
1129 os << std::setw(8) << std::left <<
"---";
1130 os << std::setw(8) << std::left <<
"---";
1135 os << std::setw(6) << std::left << state_->iter;
1136 os << std::setw(15) << std::left << state_->value;
1137 os << std::setw(15) << std::left << state_->cnorm;
1138 os << std::setw(15) << std::left << state_->gnorm;
1139 os << std::setw(15) << std::left << state_->snorm;
1140 os << std::scientific << std::setprecision(2);
1141 os << std::setw(10) << std::left << Delta_;
1142 os << std::setw(10) << std::left << nnorm_;
1143 os << std::setw(10) << std::left << tnorm_;
1144 os << std::scientific << std::setprecision(6);
1145 os << std::setw(8) << std::left << state_->nfval;
1146 os << std::setw(8) << std::left << state_->ngrad;
1147 os << std::setw(8) << std::left << iterCG_;
1148 os << std::setw(8) << std::left << flagCG_;
1149 os << std::setw(8) << std::left << flagAC_;
1150 os << std::left << totalCallLS_ <<
"/" << totalIterLS_;
void accept(Vector< Real > &s, Vector< Real > &n, Vector< Real > &t, Real f_new, Vector< Real > &c_new, Vector< Real > &gf_new, Vector< Real > &l_new, Vector< Real > &g_new, const Vector< Real > &x, const Vector< Real > &l, Real f, const Vector< Real > &gf, const Vector< Real > &c, const Vector< Real > &g, Vector< Real > &tCP, Vector< Real > &Wg, Objective< Real > &obj, Constraint< Real > &con, std::ostream &os)
Check acceptance of subproblem solutions, adjust merit function penalty parameter,...