1
       2
       3
       4
       5
       6
       7
       8
       9
      10
      11
      12
      13
      14
      15
      16
      17
      18
      19
      20
      21
      22
      23
      24
      25
      26
      27
      28
      29
      30
      31
      32
      33
      34
      35
      36
      37
      38
      39
      40
      41
      42
      43
      44
      45
      46
      47
      48
      49
      50
      51
      52
      53
      54
      55
      56
      57
      58
      59
      60
      61
      62
      63
      64
      65
      66
      67
      68
      69
      70
      71
      72
      73
      74
      75
      76
      77
      78
      79
      80
      81
      82
      83
      84
      85
      86
      87
      88
      89
      90
      91
      92
      93
      94
      95
      96
      97
      98
      99
     100
     101
     102
     103
     104
     105
     106
     107
     108
     109
#include <stdio.h>
#include <stdlib.h>
#include <stddef.h>

/*
 * Print an m-by-n matrix of doubles to stdout.
 *
 * Each matrix row is written on its own line, every entry formatted with
 * "%9.2lf " (so each line ends with a trailing space), and the whole matrix
 * is followed by one empty line.
 *
 *   m, n     number of rows / columns to print
 *   A        pointer to the element at row 0, column 0
 *   incRowA  distance, in elements, between vertically adjacent entries
 *   incColA  distance, in elements, between horizontally adjacent entries
 *
 * Element (i, j) is read from A[i*incRowA + j*incColA].
 */
void
printDGeMatrix(size_t m, size_t n,
               const double *A,
               ptrdiff_t incRowA, ptrdiff_t incColA)
{
    for (size_t i=0; i<m; ++i) {
        for (size_t j=0; j<n; ++j) {
            // Convert the unsigned counters before multiplying: otherwise the
            // signed strides are promoted to size_t and a negative stride
            // produces a wrapped, out-of-range index.
            const ptrdiff_t offset = (ptrdiff_t)i*incRowA
                                   + (ptrdiff_t)j*incColA;
            printf("%9.2lf ", A[offset]);
        }
        printf("\n");
    }
    printf("\n");
}

/*
 * Scale a strided vector in place: x[i*incX] = alpha * x[i*incX]
 * for i = 0, ..., n-1.
 *
 *   n      number of vector elements to process
 *   alpha  scale factor
 *   x      pointer to the element with index 0
 *   incX   distance, in elements, between consecutive entries
 *
 * Special cases:
 *   alpha == 1  returns immediately without touching x
 *   alpha == 0  stores 0 into every entry instead of multiplying
 */
void
dscal(size_t n,
      double alpha,
      double *x, ptrdiff_t incX)
{
    if (alpha==1) {
        return;
    }

    // The counter is converted to ptrdiff_t before it is multiplied by the
    // stride. Multiplying size_t by ptrdiff_t would convert the stride to
    // unsigned, so a negative incX would give a wrapped, out-of-range index.
    if (alpha!=0) {
        for (size_t i=0; i<n; ++i) {
            x[(ptrdiff_t)i*incX] *= alpha;
        }
    } else {
        // Plain assignment: the previous content of x is never read here.
        for (size_t i=0; i<n; ++i) {
            x[(ptrdiff_t)i*incX] = 0;
        }
    }
}

/*
 * Rank-1 update of a general m-by-n matrix: A = A + alpha * x * y^T,
 * i.e. A(i, j) += alpha * x(i) * y(j) for 0 <= i < m, 0 <= j < n.
 *
 *   m, n              number of rows / columns of A
 *   alpha             scalar factor of the update
 *   x, incX           vector with m entries and its element stride
 *   y, incY           vector with n entries and its element stride
 *   A                 pointer to the element at row 0, column 0
 *   incRowA, incColA  element strides between rows / columns of A
 *
 * Nothing is read or written when alpha == 0 or when either dimension is 0.
 */
void
dger(size_t m, size_t n,
     double alpha,
     const double *x, ptrdiff_t incX,
     const double *y, ptrdiff_t incY,
     double *A, ptrdiff_t incRowA, ptrdiff_t incColA)
{
    if (alpha==0 || m==0 || n==0) {
        return;
    }

    // Make the inner loop run along the smaller stride by updating the
    // transposed problem (roles of x and y, and of the two strides, swapped).
    // After the swap the condition is false, so this recurses at most once.
    if (incRowA>incColA) {
        dger(n, m, alpha, y, incY, x, incX, A, incColA, incRowA);
        return;
    }

    for (size_t j=0; j<n; ++j) {
        // Signed copies of the counters: multiplying size_t by ptrdiff_t
        // would convert the stride to unsigned, so a negative stride would
        // give a wrapped, out-of-range index.
        const ptrdiff_t col = (ptrdiff_t)j;

        for (size_t i=0; i<m; ++i) {
            const ptrdiff_t row = (ptrdiff_t)i;

            A[row*incRowA + col*incColA] += alpha*x[row*incX]*y[col*incY];
        }
    }
}

// Demo driver: fills a 3x4 matrix, prints it, overwrites it with the result
// of an LU factorization computed without pivoting, and prints it again.
int
main()
{
    // Matrix shape and element strides (column-major: rows are contiguous
    // within a column, columns are m elements apart).
    const size_t m = 3;
    const size_t n = 4;
    const ptrdiff_t incRowA = 1;
    const ptrdiff_t incColA = m;

    // Initial entries, listed row by row.
    const double init[3][4] = {
        {2, 1, 3, 1},
        {4, 5, 6, 2},
        {8, 8, 9, 3},
    };

    double *A = malloc(m*n*sizeof(double));
    if (A == NULL) {
        abort();
    }

    for (size_t i=0; i<m; ++i) {
        for (size_t j=0; j<n; ++j) {
            A[i*incRowA + j*incColA] = init[i][j];
        }
    }

    printf("A =\n");
    printDGeMatrix(m, n, A, incRowA, incColA);

    // Factorize in place, one elimination step per diagonal entry.
    const size_t steps = n<m ? n : m;

    for (size_t p=0; p<steps; ++p) {
        double *pivot    = &A[p*incRowA + p*incColA];
        double *below    = pivot + incRowA;     // column part under the pivot
        double *right    = pivot + incColA;     // row part right of the pivot
        double *trailing = below + incColA;     // remaining lower-right block

        const size_t rowsLeft = m-1-p;
        const size_t colsLeft = n-1-p;
        const double invPivot = 1 / *pivot;

        // Turn the column under the pivot into multipliers ...
        dscal(rowsLeft, invPivot, below, incRowA);
        // ... and subtract multipliers * pivot row from the trailing block.
        dger(rowsLeft, colsLeft, -1,
             below, incRowA,
             right, incColA,
             trailing, incRowA, incColA);
    }

    printf("A =\n");
    printDGeMatrix(m, n, A, incRowA, incColA);

    free(A);
}