Click here to Skip to main content
15,886,199 members
Articles / Multimedia / DirectX

Rendering Text with Direct2D & DirectWrite

Rate me:
Please Sign up or sign in to vote.
4.94/5 (39 votes)
3 Jan 2015CPOL8 min read 105.9K   2.8K   76  
Direct2D, DirectWrite, Windows API, C++, std::shared_ptr and more
#include "stdafx.h"

/*
* -- SuperLU routine (version 3.0) --
* Univ. of California Berkeley, Xerox Palo Alto Research Center,
* and Lawrence Berkeley National Lab.
* October 15, 2003
*
*/
/*
* File name:		dsp_blas2.c
* Purpose:		Sparse BLAS 2, using some dense BLAS 2 operations.
*/

#include "hnum_pdsp_defs.h"


namespace harlinn
{
    namespace numerics
    {
        namespace SuperLU
        {
            namespace Double
            {

                int
                    sp_dtrsv(char *uplo, char *trans, char *diag, SuperMatrix *L, 
                    SuperMatrix *U, double *x, int *info)
                {
                    /*
                    *   Purpose
                    *   =======
                    *
                    *   sp_dtrsv() solves one of the systems of equations   
                    *       A*x = b,   or   A'*x = b,
                    *   where b and x are n element vectors and A is a sparse unit , or   
                    *   non-unit, upper or lower triangular matrix.   
                    *   No test for singularity or near-singularity is included in this   
                    *   routine. Such tests must be performed before calling this routine.   
                    *
                    *   Parameters   
                    *   ==========   
                    *
                    *   uplo   - (input) char*
                    *            On entry, uplo specifies whether the matrix is an upper or   
                    *             lower triangular matrix as follows:   
                    *                uplo = 'U' or 'u'   A is an upper triangular matrix.   
                    *                uplo = 'L' or 'l'   A is a lower triangular matrix.   
                    *
                    *   trans  - (input) char*
                    *             On entry, trans specifies the equations to be solved as   
                    *             follows:   
                    *                trans = 'N' or 'n'   A*x = b.   
                    *                trans = 'T' or 't'   A'*x = b.
                    *                trans = 'C' or 'c'   A'*x = b.   
                    *
                    *   diag   - (input) char*
                    *             On entry, diag specifies whether or not A is unit   
                    *             triangular as follows:   
                    *                diag = 'U' or 'u'   A is assumed to be unit triangular.   
                    *                diag = 'N' or 'n'   A is not assumed to be unit   
                    *                                    triangular.   
                    *	     
                    *   L       - (input) SuperMatrix*
                    *	       The factor L from the factorization Pr*A*Pc=L*U. Use
                    *             compressed row subscripts storage for supernodes,
                    *             i.e., L has types: Stype = SC, Dtype = _D, Mtype = TRLU.
                    *
                    *   U       - (input) SuperMatrix*
                    *	        The factor U from the factorization Pr*A*Pc=L*U.
                    *	        U has types: Stype = NCP, Dtype = _D, Mtype = TRU.
                    *    
                    *   x       - (input/output) double*
                    *             Before entry, the incremented array X must contain the n   
                    *             element right-hand side vector b. On exit, X is overwritten 
                    *             with the solution vector x.
                    *
                    *   info    - (output) int*
                    *             If *info = -i, the i-th argument had an illegal value.
                    *
                    */
#if ( MACH==CRAY_PVP )
                    _fcd ftcs1, ftcs2, ftcs3;
#endif
                    SCPformat *Lstore;
                    NCPformat *Ustore;
                    double   *Lval, *Uval;
                    int incx = 1, incy = 1;
                    double alpha = 1.0, beta = 1.0;
                    register int fsupc, luptr, istart, irow, k, iptr, jcol, nsuper;
                    int          nsupr, nsupc, nrow, i;
                    double *work;
                    flops_t solve_ops;

                    /* Test the input parameters */
                    *info = 0;
                    if ( !lsame_(uplo,"L") && !lsame_(uplo, "U") ) *info = -1;
                    else if ( !lsame_(trans, "N") && !lsame_(trans, "T") ) *info = -2;
                    else if ( !lsame_(diag, "U") && !lsame_(diag, "N") ) *info = -3;
                    else if ( L->nrow != L->ncol || L->nrow < 0 ) *info = -4;
                    else if ( U->nrow != U->ncol || U->nrow < 0 ) *info = -5;
                    if ( *info ) {
                        i = -(*info);
                        xerbla_("sp_dtrsv", &i);
                        return 0;
                    }

                    Lstore = (SCPformat*) L->Store;
                    Lval = (double*) Lstore->nzval;
                    Ustore = (NCPformat*) U->Store;
                    Uval = (double*) Ustore->nzval;
                    nsuper = Lstore->nsuper;
                    solve_ops = 0;

                    if ( !(work = doubleCalloc(L->nrow)) )
                        SUPERLU_ABORT("Malloc fails for work in sp_dtrsv().");

                    if ( lsame_(trans, "N") ) {	/* Form x := inv(A)*x. */

                        if ( lsame_(uplo, "L") ) {
                            /* Form x := inv(L)*x */
                            if ( L->nrow == 0 ) return 0; /* Quick return */

                            for (k = 0; k <= nsuper; k++) {
                                fsupc = L_FST_SUPC(k);
                                istart = L_SUB_START(fsupc);
                                nsupr = L_SUB_END(fsupc) - istart;
                                nsupc = L_LAST_SUPC(k) - fsupc;
                                luptr = L_NZ_START(fsupc);
                                nrow = nsupr - nsupc;

                                solve_ops += nsupc * (nsupc - 1);
                                solve_ops += 2 * nrow * nsupc;

                                if ( nsupc == 1 ) {
                                    for (iptr=istart+1; iptr < L_SUB_END(fsupc); ++iptr) {
                                        irow = L_SUB(iptr);
                                        ++luptr;
                                        x[irow] -= x[fsupc] * Lval[luptr];
                                    }
                                } else {
#ifdef USE_VENDOR_BLAS
#if ( MACH==CRAY_PVP )
                                    ftcs1 = _cptofcd("L", strlen("L"));
                                    ftcs2 = _cptofcd("N", strlen("N"));
                                    ftcs3 = _cptofcd("U", strlen("U"));

                                    STRSV(ftcs1, ftcs2, ftcs3, &nsupc, &Lval[luptr], &nsupr,
                                        &x[fsupc], &incx);

                                    SGEMV(ftcs2, &nrow, &nsupc, &alpha, &Lval[luptr+nsupc], 
                                        &nsupr, &x[fsupc], &incx, &beta, &work[0], &incy);
#else
                                    dtrsv_("L", "N", "U", &nsupc, &Lval[luptr], &nsupr,
                                        &x[fsupc], &incx);

                                    dgemv_("N", &nrow, &nsupc, &alpha, &Lval[luptr+nsupc], 
                                        &nsupr, &x[fsupc], &incx, &beta, &work[0], &incy);
#endif
#else
                                    dlsolve (nsupr, nsupc, &Lval[luptr], &x[fsupc]);

                                    dmatvec (nsupr, nsupr-nsupc, nsupc, &Lval[luptr+nsupc],
                                        &x[fsupc], &work[0] );
#endif		

                                    iptr = istart + nsupc;
                                    for (i = 0; i < nrow; ++i, ++iptr) {
                                        irow = L_SUB(iptr);
                                        x[irow] -= work[i];	/* Scatter */
                                        work[i] = 0.0;

                                    }
                                }
                            } /* for k ... */

                        } else {
                            /* Form x := inv(U)*x */

                            if ( U->nrow == 0 ) return 0; /* Quick return */

                            for (k = nsuper; k >= 0; k--) {
                                fsupc = L_FST_SUPC(k);
                                nsupr = L_SUB_END(fsupc) - L_SUB_START(fsupc);
                                nsupc = L_LAST_SUPC(k) - fsupc;
                                luptr = L_NZ_START(fsupc);

                                solve_ops += nsupc * (nsupc + 1);

                                if ( nsupc == 1 ) {
                                    x[fsupc] /= Lval[luptr];
                                    for (i = U_NZ_START(fsupc); i < U_NZ_END(fsupc); ++i) {
                                        irow = U_SUB(i);
                                        x[irow] -= x[fsupc] * Uval[i];
                                    }
                                } else {
#ifdef USE_VENDOR_BLAS
#if ( MACH==CRAY_PVP )
                                    ftcs1 = _cptofcd("U", strlen("U"));
                                    ftcs2 = _cptofcd("N", strlen("N"));
                                    ftcs3 = _cptofcd("N", strlen("N"));

                                    STRSV(ftcs1, ftcs2, ftcs3, &nsupc, &Lval[luptr], &nsupr,
                                        &x[fsupc], &incx);
#else
                                    dtrsv_("U", "N", "N", &nsupc, &Lval[luptr], &nsupr,
                                        &x[fsupc], &incx);
#endif
#else		
                                    dusolve ( nsupr, nsupc, &Lval[luptr], &x[fsupc] );
#endif		

                                    for (jcol = fsupc; jcol < fsupc + nsupc; jcol++) {
                                        solve_ops += 2*(U_NZ_END(jcol) - U_NZ_START(jcol));
                                        for (i = U_NZ_START(jcol); i < U_NZ_END(jcol); i++) {
                                            irow = U_SUB(i);
                                            x[irow] -= x[jcol] * Uval[i];
                                        }
                                    }
                                }
                            } /* for k ... */

                        }
                    } else { /* Form x := inv(A')*x */

                        if ( lsame_(uplo, "L") ) {
                            /* Form x := inv(L')*x */
                            if ( L->nrow == 0 ) return 0; /* Quick return */

                            for (k = nsuper; k >= 0; --k) {
                                fsupc = L_FST_SUPC(k);
                                istart = L_SUB_START(fsupc);
                                nsupr = L_SUB_END(fsupc) - istart;
                                nsupc = L_LAST_SUPC(k) - fsupc;
                                luptr = L_NZ_START(fsupc);

                                solve_ops += 2 * (nsupr - nsupc) * nsupc;

                                for (jcol = fsupc; jcol < L_LAST_SUPC(k); jcol++) {
                                    iptr = istart + nsupc;
                                    for (i = L_NZ_START(jcol) + nsupc; 
                                        i < L_NZ_END(jcol); i++) {
                                            irow = L_SUB(iptr);
                                            x[jcol] -= x[irow] * Lval[i];
                                            iptr++;
                                    }
                                }

                                if ( nsupc > 1 ) {
                                    solve_ops += nsupc * (nsupc - 1);
#ifdef _CRAY
                                    ftcs1 = _cptofcd("L", strlen("L"));
                                    ftcs2 = _cptofcd("T", strlen("T"));
                                    ftcs3 = _cptofcd("U", strlen("U"));
                                    STRSV(ftcs1, ftcs2, ftcs3, &nsupc, &Lval[luptr], &nsupr,
                                        &x[fsupc], &incx);
#else
                                    dtrsv_("L", "T", "U", &nsupc, &Lval[luptr], &nsupr,
                                        &x[fsupc], &incx);
#endif
                                }
                            }
                        } else {
                            /* Form x := inv(U')*x */
                            if ( U->nrow == 0 ) return 0; /* Quick return */

                            for (k = 0; k <= nsuper; k++) {
                                fsupc = L_FST_SUPC(k);
                                nsupr = L_SUB_END(fsupc) - L_SUB_START(fsupc);
                                nsupc = L_LAST_SUPC(k) - fsupc;
                                luptr = L_NZ_START(fsupc);

                                for (jcol = fsupc; jcol < fsupc + nsupc; jcol++) {
                                    solve_ops += 2*(U_NZ_END(jcol) - U_NZ_START(jcol));
                                    for (i = U_NZ_START(jcol); i < U_NZ_END(jcol); i++) {
                                        irow = U_SUB(i);
                                        x[jcol] -= x[irow] * Uval[i];
                                    }
                                }

                                solve_ops += nsupc * (nsupc + 1);

                                if ( nsupc == 1 ) {
                                    x[fsupc] /= Lval[luptr];
                                } else {
#ifdef _CRAY
                                    ftcs1 = _cptofcd("U", strlen("U"));
                                    ftcs2 = _cptofcd("T", strlen("T"));
                                    ftcs3 = _cptofcd("N", strlen("N"));
                                    STRSV( ftcs1, ftcs2, ftcs3, &nsupc, &Lval[luptr], &nsupr,
                                        &x[fsupc], &incx);
#else
                                    dtrsv_("U", "T", "N", &nsupc, &Lval[luptr], &nsupr,
                                        &x[fsupc], &incx);
#endif
                                }
                            } /* for k ... */
                        }
                    }

                    SUPERLU_FREE(work);
                    return 0;
                }




                int
                    sp_dgemv(char *trans, double alpha, SuperMatrix *A, double *x, 
                    int incx, double beta, double *y, int incy)
                {
                    /*  Purpose   
                    =======   

                    sp_dgemv()  performs one of the matrix-vector operations   
                    y := alpha*A*x + beta*y,   or   y := alpha*A'*x + beta*y,   
                    where alpha and beta are scalars, x and y are vectors and A is a
                    sparse A->nrow by A->ncol matrix.   

                    Parameters   
                    ==========   

                    TRANS  - (input) char*
                    On entry, TRANS specifies the operation to be performed as   
                    follows:   
                    TRANS = 'N' or 'n'   y := alpha*A*x + beta*y.   
                    TRANS = 'T' or 't'   y := alpha*A'*x + beta*y.   
                    TRANS = 'C' or 'c'   y := alpha*A'*x + beta*y.   

                    ALPHA  - (input) double
                    On entry, ALPHA specifies the scalar alpha.   

                    A      - (input) SuperMatrix*
                    Matrix A with a sparse format, of dimension (A->nrow, A->ncol).
                    Currently, the type of A can be:
                    Stype = NC or NCP; Dtype = SLU_D; Mtype = GE. 
                    In the future, more general A can be handled.

                    X      - (input) double*, array of DIMENSION at least   
                    ( 1 + ( n - 1 )*abs( INCX ) ) when TRANS = 'N' or 'n'   
                    and at least   
                    ( 1 + ( m - 1 )*abs( INCX ) ) otherwise.   
                    Before entry, the incremented array X must contain the   
                    vector x.   

                    INCX   - (input) int
                    On entry, INCX specifies the increment for the elements of   
                    X. INCX must not be zero.   

                    BETA   - (input) double
                    On entry, BETA specifies the scalar beta. When BETA is   
                    supplied as zero then Y need not be set on input.   

                    Y      - (output) double*,  array of DIMENSION at least   
                    ( 1 + ( m - 1 )*abs( INCY ) ) when TRANS = 'N' or 'n'   
                    and at least   
                    ( 1 + ( n - 1 )*abs( INCY ) ) otherwise.   
                    Before entry with BETA non-zero, the incremented array Y   
                    must contain the vector y. On exit, Y is overwritten by the 
                    updated vector y.

                    INCY   - (input) int
                    On entry, INCY specifies the increment for the elements of   
                    Y. INCY must not be zero.   

                    ==== Sparse Level 2 Blas routine.   
                    */

                    /* Local variables */
                    NCformat *Astore;
                    double   *Aval;
                    int info;
                    double temp;
                    int lenx, leny, i, j, irow;
                    int iy, jx, jy, kx, ky;
                    int notran;

                    notran = lsame_(trans, "N");
                    Astore = (NCformat *)A->Store;
                    Aval = (double *)Astore->nzval;

                    /* Test the input parameters */
                    info = 0;
                    if ( !notran && !lsame_(trans, "T") && !lsame_(trans, "C")) info = 1;
                    else if ( A->nrow < 0 || A->ncol < 0 ) info = 3;
                    else if (incx == 0) info = 5;
                    else if (incy == 0)	info = 8;
                    if (info != 0) {
                        xerbla_("sp_dgemv ", &info);
                        return 0;
                    }

                    /* Quick return if possible. */
                    if (A->nrow == 0 || A->ncol == 0 || (alpha == 0. && beta == 1.))
                        return 0;

                    /* Set  LENX  and  LENY, the lengths of the vectors x and y, and set 
                    up the start points in  X  and  Y. */
                    if (lsame_(trans, "N")) {
                        lenx = A->ncol;
                        leny = A->nrow;
                    } else {
                        lenx = A->nrow;
                        leny = A->ncol;
                    }
                    if (incx > 0) kx = 0;
                    else kx =  - (lenx - 1) * incx;
                    if (incy > 0) ky = 0;
                    else ky =  - (leny - 1) * incy;

                    /* Start the operations. In this version the elements of A are   
                    accessed sequentially with one pass through A. */
                    /* First form  y := beta*y. */
                    if (beta != 1.) {
                        if (incy == 1) {
                            if (beta == 0.)
                                for (i = 0; i < leny; ++i) y[i] = 0.;
                            else
                                for (i = 0; i < leny; ++i) y[i] = beta * y[i];
                        } else {
                            iy = ky;
                            if (beta == 0.)
                                for (i = 0; i < leny; ++i) {
                                    y[iy] = 0.;
                                    iy += incy;
                                }
                            else
                                for (i = 0; i < leny; ++i) {
                                    y[iy] = beta * y[iy];
                                    iy += incy;
                                }
                        }
                    }

                    if (alpha == 0.) return 0;

                    if ( notran ) {
                        /* Form  y := alpha*A*x + y. */
                        jx = kx;
                        if (incy == 1) {
                            for (j = 0; j < A->ncol; ++j) {
                                if (x[jx] != 0.) {
                                    temp = alpha * x[jx];
                                    for (i = Astore->colptr[j]; i < Astore->colptr[j+1]; ++i) {
                                        irow = Astore->rowind[i];
                                        y[irow] += temp * Aval[i];
                                    }
                                }
                                jx += incx;
                            }
                        } else {
                            SUPERLU_ABORT("Not implemented.");
                        }
                    } else {
                        /* Form  y := alpha*A'*x + y. */
                        jy = ky;
                        if (incx == 1) {
                            for (j = 0; j < A->ncol; ++j) {
                                temp = 0.;
                                for (i = Astore->colptr[j]; i < Astore->colptr[j+1]; ++i) {
                                    irow = Astore->rowind[i];
                                    temp += Aval[i] * x[irow];
                                }
                                y[jy] += alpha * temp;
                                jy += incy;
                            }
                        } else {
                            SUPERLU_ABORT("Not implemented.");
                        }
                    }
                    return 0;
                } /* sp_dgemv */

            };
        };
    };
};



By viewing downloads associated with this article you agree to the Terms of Service and the article's licence.

If a file you wish to view isn't highlighted, and is a text file (not binary), please let us know and we'll add colourisation support for it.

License

This article, along with any associated source code and files, is licensed under The Code Project Open License (CPOL)


Written By
Architect Sea Surveillance AS
Norway Norway
Chief Architect - Sea Surveillance AS.

Specializing in integrated operations and high performance computing solutions.

I’ve been fooling around with computers since the early eighties, I’ve even done work on CP/M and MP/M.

Wrote my first “real” program on a BBC micro model B based on a series in a magazine at that time. It was fun and I got hooked on this thing called programming ...

A few Highlights:

  • High performance application server development
  • Model Driven Architecture and Code generators
  • Real-Time Distributed Solutions
  • C, C++, C#, Java, TSQL, PL/SQL, Delphi, ActionScript, Perl, Rexx
  • Microsoft SQL Server, Oracle RDBMS, IBM DB2, PostGreSQL
  • AMQP, Apache qpid, RabbitMQ, Microsoft Message Queuing, IBM WebSphereMQ, Oracle TuxidoMQ
  • Oracle WebLogic, IBM WebSphere
  • Corba, COM, DCE, WCF
  • AspenTech InfoPlus.21(IP21), OsiSoft PI


More information about what I do for a living can be found at: harlinn.com or LinkedIn

You can contact me at espen@harlinn.no

Comments and Discussions