Get rid of assumptions, which always did cause trouble. Instead,

solve the Newton's method iterations in a least squares sense. This is much less likely to result in numerical disaster; a parameter will never make a very large change, unless that really is the only way to satisfy the constraints. [git-p4: depot-paths = "//depot/solvespace/": change = 1717]
2008-05-11 23:29:50 -08:00 · 2008-05-11 23:29:50 -08:00 · f4d2651031
commit f4d2651031
parent e2263c69c8
2 changed files with 66 additions and 116 deletions
--- a/solvespace.h
+++ b/solvespace.h
@ -112,8 +112,6 @@ public:
        // The corresponding parameter for each column
        hParam      param[MAX_UNKNOWNS];
        // The desired permutation, when we are sorting by sensitivity.
        int         permutation[MAX_UNKNOWNS];
        bool        bound[MAX_UNKNOWNS];
@ -124,11 +122,10 @@ public:
            double       num[MAX_UNKNOWNS][MAX_UNKNOWNS];
        }           A;
-        // Extra information about each unknown: whether it's being dragged
+        // Some helpers for the least squares solve
-        // or not (in which case it should get assumed preferentially), and
+        double AAt[MAX_UNKNOWNS][MAX_UNKNOWNS];
-        // the sensitivity used to decide the order in which things get
+        double Z[MAX_UNKNOWNS];
-        // assumed.
+
        double      sens[MAX_UNKNOWNS];
        double      X[MAX_UNKNOWNS];
        struct {
@ -138,13 +135,14 @@ public:
    } mat;
    bool Tol(double v);
-    void GaussJordan(void);
+    int GaussJordan(void);
-    bool SolveLinearSystem(void);
+    static bool SolveLinearSystem(double X[], double A[][MAX_UNKNOWNS],
                                  double B[], int N);
    bool SolveLeastSquares(void);
    void WriteJacobian(int eqTag, int paramTag);
    void EvalJacobian(void);
    void SortBySensitivity(void);
    void SolveBySubstitution(void);
    static bool IsDragged(hParam p);
--- a/system.cpp
+++ b/system.cpp
@ -28,6 +28,7 @@ void System::WriteJacobian(int eqTag, int paramTag) {
            if(scoreboard & (1 << (mat.param[j].v % 31))) { 
                pd = f->PartialWrt(mat.param[j]);
                pd = pd->FoldConstants();
                pd = pd->DeepCopyWithParamsAsPointers(&param, &(SS.param));
            } else {
                pd = Expr::FromConstant(0);
            }
@ -144,73 +145,11 @@ void System::SolveBySubstitution(void) {
    }
 }
 static int BySensitivity(const void *va, const void *vb) {
    const int *a = (const int *)va, *b = (const int *)vb;
    hParam pa = SS.sys.mat.param[*a];
    hParam pb = SS.sys.mat.param[*b];
    if(System::IsDragged(pa) && !System::IsDragged(pb)) return  1;
    if(System::IsDragged(pb) && !System::IsDragged(pa)) return -1;
    double as = SS.sys.mat.sens[*a];
    double bs = SS.sys.mat.sens[*b];
    if(as < bs) return  1;
    if(as > bs) return -1;
    return 0;
 }
 void System::SortBySensitivity(void) {
    // For each unknown, sum up the sensitivities in that column of the
    // Jacobian
    int i, j;
    for(j = 0; j < mat.n; j++) {
        double s = 0;
        int i;
        for(i = 0; i < mat.m; i++) {
            s += fabs(mat.A.num[i][j]);
        }
        mat.sens[j] = s;
    }
    for(j = 0; j < mat.n; j++) {
        mat.permutation[j] = j;
    }
    qsort(mat.permutation, mat.n, sizeof(mat.permutation[0]), BySensitivity);
    int origPos[MAX_UNKNOWNS];
    int entryWithOrigPos[MAX_UNKNOWNS];
    for(j = 0; j < mat.n; j++) {
        origPos[j] = j;
        entryWithOrigPos[j] = j;
    }
    for(j = 0; j < mat.n; j++) {
        int dest = j; // we are writing to position j
        // And the source is whichever position ahead of us can be swapped
        // in to make the permutation vectors line up.
        int src = entryWithOrigPos[mat.permutation[j]];
        for(i = 0; i < mat.m; i++) {
            SWAP(double, mat.A.num[i][src], mat.A.num[i][dest]);
            SWAP(Expr *, mat.A.sym[i][src], mat.A.sym[i][dest]);
        }
        SWAP(hParam, mat.param[src], mat.param[dest]);
        SWAP(int, origPos[src], origPos[dest]);
        if(mat.permutation[dest] != origPos[dest]) oops();
        // Update the table; only necessary to do this for src, since dest
        // is already done.
        entryWithOrigPos[origPos[src]] = src;
    }
 }
 bool System::Tol(double v) {
    return (fabs(v) < 0.01);
 }
-void System::GaussJordan(void) {
+int System::GaussJordan(void) {
    int i, j;
    for(j = 0; j < mat.n; j++) {
@ -219,6 +158,7 @@ void System::GaussJordan(void) {
    // Now eliminate.
    i = 0;
    int rank = 0;
    for(j = 0; j < mat.n; j++) {
        // First, seek a pivot in our column.
        int ip, imax;
@ -263,6 +203,7 @@ void System::GaussJordan(void) {
            // And mark this as a bound variable.
            mat.bound[j] = true;
            rank++;
            // Move on to the next row, since we just used this one to
            // eliminate from column j.
@ -270,24 +211,26 @@ void System::GaussJordan(void) {
            if(i >= mat.m) break;
        }
    }
    return rank;
 }
-bool System::SolveLinearSystem(void) {
+bool System::SolveLinearSystem(double X[], double A[][MAX_UNKNOWNS],
-    if(mat.m != mat.n) oops();
+                               double B[], int n)
 {
    // Gaussian elimination, with partial pivoting. It's an error if the
    // matrix is singular, because that means two constraints are
    // equivalent.
    int i, j, ip, jp, imax;
    double max, temp;
-    for(i = 0; i < mat.m; i++) {
+    for(i = 0; i < n; i++) {
        // We are trying eliminate the term in column i, for rows i+1 and
        // greater. First, find a pivot (between rows i and N-1).
        max = 0;
-        for(ip = i; ip < mat.m; ip++) {
+        for(ip = i; ip < n; ip++) {
-            if(fabs(mat.A.num[ip][i]) > max) {
+            if(fabs(A[ip][i]) > max) {
                imax = ip;
-                max = fabs(mat.A.num[ip][i]);
+                max = fabs(A[ip][i]);
            }
        }
        // Don't give up on a singular matrix unless it's really bad; the
@ -296,44 +239,67 @@ bool System::SolveLinearSystem(void) {
        if(fabs(max) < 1e-20) return false;
        // Swap row imax with row i
-        for(jp = 0; jp < mat.n; jp++) {
+        for(jp = 0; jp < n; jp++) {
-            temp = mat.A.num[i][jp];
+            SWAP(double, A[i][jp], A[imax][jp]);
            mat.A.num[i][jp] = mat.A.num[imax][jp];
            mat.A.num[imax][jp] = temp;
        }
-        temp = mat.B.num[i];
+        SWAP(double, B[i], B[imax]);
        mat.B.num[i] = mat.B.num[imax];
        mat.B.num[imax] = temp;
        // For rows i+1 and greater, eliminate the term in column i.
-        for(ip = i+1; ip < mat.m; ip++) {
+        for(ip = i+1; ip < n; ip++) {
-            temp = mat.A.num[ip][i]/mat.A.num[i][i];
+            temp = A[ip][i]/A[i][i];
-            for(jp = 0; jp < mat.n; jp++) {
+            for(jp = 0; jp < n; jp++) {
-                mat.A.num[ip][jp] -= temp*(mat.A.num[i][jp]);
+                A[ip][jp] -= temp*(A[i][jp]);
            }
-            mat.B.num[ip] -= temp*mat.B.num[i];
+            B[ip] -= temp*B[i];
        }
    }
    // We've put the matrix in upper triangular form, so at this point we
    // can solve by back-substitution.
-    for(i = mat.m - 1; i >= 0; i--) {
+    for(i = n - 1; i >= 0; i--) {
-        if(fabs(mat.A.num[i][i]) < 1e-20) return false;
+        if(fabs(A[i][i]) < 1e-20) return false;
-        temp = mat.B.num[i];
+        temp = B[i];
-        for(j = mat.n - 1; j > i; j--) {
+        for(j = n - 1; j > i; j--) {
-            temp -= mat.X[j]*mat.A.num[i][j];
+            temp -= X[j]*A[i][j];
        }
-        mat.X[i] = temp / mat.A.num[i][i];
+        X[i] = temp / A[i][i];
    }
    return true;
 }
 bool System::SolveLeastSquares(void) {
    int r, c, i;
    // Write A*A'
    for(r = 0; r < mat.m; r++) {
        for(c = 0; c < mat.m; c++) {  // yes, AAt is square
            double sum = 0;
            for(i = 0; i < mat.n; i++) {
                sum += mat.A.num[r][i]*mat.A.num[c][i];
            }
            mat.AAt[r][c] = sum;
        }
    }
    if(!SolveLinearSystem(mat.Z, mat.AAt, mat.B.num, mat.m)) return false;
    // And multiply that by A' to get our solution.
    for(c = 0; c < mat.n; c++) {
        double sum = 0;
        for(i = 0; i < mat.m; i++) {
            sum += mat.A.num[i][c]*mat.Z[i];
        }
        mat.X[c] = sum;
    }
    return true;
 }
 bool System::NewtonSolve(int tag) {
    WriteJacobian(tag, tag);
-    if(mat.m != mat.n) oops();
+    if(mat.m > mat.n) oops();
    int iter = 0;
    bool converged = false;
@ -347,11 +313,11 @@ bool System::NewtonSolve(int tag) {
        // And evaluate the Jacobian at our initial operating point.
        EvalJacobian();
-        if(!SolveLinearSystem()) break;
+        if(!SolveLeastSquares()) break;
        // Take the Newton step; 
        //      J(x_n) (x_{n+1} - x_n) = 0 - F(x_n)
-        for(i = 0; i < mat.m; i++) {
+        for(i = 0; i < mat.n; i++) {
            (param.FindById(mat.param[i]))->val -= mat.X[i];
        }
@ -399,8 +365,6 @@ bool System::Solve(void) {
    EvalJacobian();
    SortBySensitivity();
 /*
    for(i = 0; i < mat.m; i++) {
        dbp("function %d: %s", i, mat.B.sym[i]->Print());
@ -408,29 +372,17 @@ bool System::Solve(void) {
    dbp("m=%d", mat.m);
    for(i = 0; i < mat.m; i++) {
        for(j = 0; j < mat.n; j++) {
-            dbp("A[%d][%d] = %.3f", i, j, mat.A.num[i][j]);
+            dbp("A(%d,%d) = %.10f;", i+1, j+1, mat.A.num[i][j]);
        }
    } */
-    GaussJordan();
+    int rank = GaussJordan();
 /*    dbp("bound states:");
    for(j = 0; j < mat.n; j++) {
        dbp("  param %08x: %d", mat.param[j], mat.bound[j]);
    } */
    // Fix any still-free variables wherever they are now.
    for(j = mat.n-1; j >= 0; --j) {
        if(mat.bound[j]) continue;
        Param *p = param.FindByIdNoOops(mat.param[j]);
        if(!p) {
            // This is parameter does not occur in this group, so it's
            // not available to assume.
            continue;
        }
        p->tag = VAR_ASSUMED;
    }
    bool ok = NewtonSolve(0);
    if(ok) {