FLA_Chol_u.h File Reference

(r)

Go to the source code of this file.

Functions

FLA_Error FLA_Chol_u_blk_var1 (FLA_Obj A, fla_chol_t *cntl)
FLA_Error FLA_Chol_u_blk_var2 (FLA_Obj A, fla_chol_t *cntl)
FLA_Error FLA_Chol_u_blk_var3 (FLA_Obj A, fla_chol_t *cntl)
FLA_Error FLA_Chol_u_unb_var1 (FLA_Obj A)
FLA_Error FLA_Chol_u_unb_var2 (FLA_Obj A)
FLA_Error FLA_Chol_u_unb_var3 (FLA_Obj A)


Function Documentation

FLA_Error FLA_Chol_u_blk_var1 ( FLA_Obj  A,
fla_chol_t * cntl 
)

References FLA_Chol_internal(), FLA_Cont_with_3x3_to_2x2(), FLA_Determine_blocksize(), FLA_Herk_internal(), FLA_MINUS_ONE, FLA_Obj_is_real(), FLA_Obj_length(), FLA_ONE, FLA_Part_2x2(), FLA_Repart_2x2_to_3x3(), FLA_Syrk_internal(), and FLA_Trsm_internal().

Referenced by FLA_Chol_u().

00038 {  /* Blocked variant 1: each pass solves for A01, updates A11 with it, then factors A11. */
00039   FLA_Obj ATL,   ATR,      A00, A01, A02,
00040           ABL,   ABR,      A10, A11, A12,
00041                            A20, A21, A22;
00042 
00043   dim_t b;  /* block size used for the current repartitioning */
00044 
00045   int value = 0;  /* result of the last FLA_Chol_internal() call; returned unchanged if the loop completes */
00046 
00047   FLA_Part_2x2( A,    &ATL, &ATR,
00048                       &ABL, &ABR,     0, 0, FLA_TL );
00049 
00050   while ( FLA_Obj_length( ATL ) < FLA_Obj_length( A ) ){  /* run until ATL is as long as A */
00051 
00052     b = FLA_Determine_blocksize( ABR, FLA_BR, FLA_Cntl_blocksize( cntl ) );
00053 
00054     FLA_Repart_2x2_to_3x3( ATL, /**/ ATR,       &A00, /**/ &A01, &A02,
00055                         /* ************* */   /* ******************** */
00056                                                 &A10, /**/ &A11, &A12,
00057                            ABL, /**/ ABR,       &A20, /**/ &A21, &A22,
00058                            b, b, FLA_BR );
00059 
00060     /*------------------------------------------------------------*/
00061 
00062     if ( FLA_Obj_is_real( A ) )  /* real case: plain transpose and Syrk */
00063     {
00064       /* A01 = inv( triu( A00 )' ) * A01; */
00065       FLA_Trsm_internal( FLA_LEFT, FLA_UPPER_TRIANGULAR,
00066                          FLA_TRANSPOSE, FLA_NONUNIT_DIAG,
00067                          FLA_ONE, A00, A01,
00068                          FLA_Cntl_sub_trsm( cntl ) );
00069 
00070       /* A11 = A11 - A01' * A01; */
00071       FLA_Syrk_internal( FLA_UPPER_TRIANGULAR, FLA_TRANSPOSE,
00072                          FLA_MINUS_ONE, A01, FLA_ONE, A11,
00073                          FLA_Cntl_sub_syrk( cntl ) );
00074 
00075       /* A11 = chol( A11 ); */
00076       value = FLA_Chol_internal( FLA_UPPER_TRIANGULAR, A11,
00077                                  FLA_Cntl_sub_chol( cntl ) );
00078 
00079       if ( value != FLA_SUCCESS )  /* stop early; the sub-result is offset by the length of A00 */
00080         return ( FLA_Obj_length( A00 ) + value );
00081     }
00082     else  /* non-real case: conjugate transpose and Herk */
00083     {
00084       /* A01 = inv( triu( A00 )' ) * A01; */
00085       FLA_Trsm_internal( FLA_LEFT, FLA_UPPER_TRIANGULAR,
00086                          FLA_CONJ_TRANSPOSE, FLA_NONUNIT_DIAG,
00087                          FLA_ONE, A00, A01,
00088                          FLA_Cntl_sub_trsm( cntl ) );
00089 
00090       /* A11 = A11 - A01' * A01; */
00091       FLA_Herk_internal( FLA_UPPER_TRIANGULAR, FLA_CONJ_TRANSPOSE,
00092                          FLA_MINUS_ONE, A01, FLA_ONE, A11,
00093                          FLA_Cntl_sub_herk( cntl ) );
00094 
00095       /* A11 = chol( A11 ); */
00096       value = FLA_Chol_internal( FLA_UPPER_TRIANGULAR, A11,
00097                                  FLA_Cntl_sub_chol( cntl ) );
00098 
00099       if ( value != FLA_SUCCESS )  /* stop early; the sub-result is offset by the length of A00 */
00100         return ( FLA_Obj_length( A00 ) + value );
00101     }
00102 
00103     /*------------------------------------------------------------*/
00104 
00105     FLA_Cont_with_3x3_to_2x2( &ATL, /**/ &ATR,       A00, A01, /**/ A02,
00106                                                      A10, A11, /**/ A12,
00107                             /* ************** */  /* ****************** */
00108                               &ABL, /**/ &ABR,       A20, A21, /**/ A22,
00109                               FLA_TL );
00110   }
00111 
00112   return value;
00113 }

FLA_Error FLA_Chol_u_blk_var2 ( FLA_Obj  A,
fla_chol_t * cntl 
)

References FLA_Chol_internal(), FLA_Cont_with_3x3_to_2x2(), FLA_Determine_blocksize(), FLA_Gemm_internal(), FLA_Herk_internal(), FLA_MINUS_ONE, FLA_Obj_is_real(), FLA_Obj_length(), FLA_ONE, FLA_Part_2x2(), FLA_Repart_2x2_to_3x3(), FLA_Syrk_internal(), and FLA_Trsm_internal().

Referenced by FLA_Chol_u().

00038 {  /* Blocked variant 2: each pass updates A11 and A12 using A01, factors A11, then solves for A12. */
00039   FLA_Obj ATL,   ATR,      A00, A01, A02,
00040           ABL,   ABR,      A10, A11, A12,
00041                            A20, A21, A22;
00042 
00043   dim_t b;  /* block size used for the current repartitioning */
00044 
00045   int value = 0;  /* result of the last FLA_Chol_internal() call; returned unchanged if the loop completes */
00046 
00047   FLA_Part_2x2( A,    &ATL, &ATR,
00048                       &ABL, &ABR,     0, 0, FLA_TL );
00049 
00050   while ( FLA_Obj_length( ATL ) < FLA_Obj_length( A ) ){  /* run until ATL is as long as A */
00051 
00052     b = FLA_Determine_blocksize( ABR, FLA_BR, FLA_Cntl_blocksize( cntl ) );
00053 
00054     FLA_Repart_2x2_to_3x3( ATL, /**/ ATR,       &A00, /**/ &A01, &A02,
00055                         /* ************* */   /* ******************** */
00056                                                 &A10, /**/ &A11, &A12,
00057                            ABL, /**/ ABR,       &A20, /**/ &A21, &A22,
00058                            b, b, FLA_BR );
00059 
00060     /*------------------------------------------------------------*/
00061 
00062     if ( FLA_Obj_is_real( A ) )  /* real case: plain transpose and Syrk */
00063     {
00064       /* A11 = A11 - A01' * A01; */
00065       FLA_Syrk_internal( FLA_UPPER_TRIANGULAR, FLA_TRANSPOSE,
00066                          FLA_MINUS_ONE, A01, FLA_ONE, A11,
00067                          FLA_Cntl_sub_syrk( cntl ) );
00068 
00069       /* A12 = A12 - A01' * A02; */
00070       FLA_Gemm_internal( FLA_TRANSPOSE, FLA_NO_TRANSPOSE,
00071                          FLA_MINUS_ONE, A01, A02, FLA_ONE, A12,
00072                          FLA_Cntl_sub_gemm( cntl ) );
00073 
00074       /* A11 = chol( A11 ); */
00075       value = FLA_Chol_internal( FLA_UPPER_TRIANGULAR, A11,
00076                                  FLA_Cntl_sub_chol( cntl ) );
00077 
00078       if ( value != FLA_SUCCESS )  /* stop before the A12 solve; the sub-result is offset by the length of A00 */
00079         return ( FLA_Obj_length( A00 ) + value );
00080 
00081       /* A12 = inv( triu( A11 )' ) * A12; */
00082       FLA_Trsm_internal( FLA_LEFT, FLA_UPPER_TRIANGULAR,
00083                          FLA_TRANSPOSE, FLA_NONUNIT_DIAG,
00084                          FLA_ONE, A11, A12,
00085                          FLA_Cntl_sub_trsm( cntl ) );
00086     }
00087     else  /* non-real case: conjugate transpose and Herk */
00088     {
00089       /* A11 = A11 - A01' * A01; */
00090       FLA_Herk_internal( FLA_UPPER_TRIANGULAR, FLA_CONJ_TRANSPOSE,
00091                          FLA_MINUS_ONE, A01, FLA_ONE, A11,
00092                          FLA_Cntl_sub_herk( cntl ) );
00093 
00094       /* A12 = A12 - A01' * A02; */
00095       FLA_Gemm_internal( FLA_CONJ_TRANSPOSE, FLA_NO_TRANSPOSE,
00096                          FLA_MINUS_ONE, A01, A02, FLA_ONE, A12,
00097                          FLA_Cntl_sub_gemm( cntl ) );
00098 
00099       /* A11 = chol( A11 ); */
00100       value = FLA_Chol_internal( FLA_UPPER_TRIANGULAR, A11,
00101                                  FLA_Cntl_sub_chol( cntl ) );
00102 
00103       if ( value != FLA_SUCCESS )  /* stop before the A12 solve; the sub-result is offset by the length of A00 */
00104         return ( FLA_Obj_length( A00 ) + value );
00105 
00106       /* A12 = inv( triu( A11 )' ) * A12; */
00107       FLA_Trsm_internal( FLA_LEFT, FLA_UPPER_TRIANGULAR,
00108                          FLA_CONJ_TRANSPOSE, FLA_NONUNIT_DIAG,
00109                          FLA_ONE, A11, A12,
00110                          FLA_Cntl_sub_trsm( cntl ) );
00111     }
00112 
00113     /*------------------------------------------------------------*/
00114 
00115     FLA_Cont_with_3x3_to_2x2( &ATL, /**/ &ATR,       A00, A01, /**/ A02,
00116                                                      A10, A11, /**/ A12,
00117                             /* ************** */  /* ****************** */
00118                               &ABL, /**/ &ABR,       A20, A21, /**/ A22,
00119                               FLA_TL );
00120   }
00121 
00122   return value;
00123 }

FLA_Error FLA_Chol_u_blk_var3 ( FLA_Obj  A,
fla_chol_t * cntl 
)

References FLA_Chol_internal(), FLA_Cont_with_3x3_to_2x2(), FLA_Determine_blocksize(), FLA_Herk_internal(), FLA_MINUS_ONE, FLA_Obj_is_real(), FLA_Obj_length(), FLA_ONE, FLA_Part_2x2(), FLA_Repart_2x2_to_3x3(), FLA_Syrk_internal(), and FLA_Trsm_internal().

Referenced by FLA_Chol_u().

00036 {  /* Blocked variant 3: each pass factors A11, solves for A12, then updates A22 with A12. */
00037   FLA_Obj ATL,   ATR,      A00, A01, A02,
00038           ABL,   ABR,      A10, A11, A12,
00039                            A20, A21, A22;
00040 
00041   dim_t b;  /* block size used for the current repartitioning */
00042 
00043   int value = 0;  /* result of the last FLA_Chol_internal() call; returned unchanged if the loop completes */
00044 
00045   FLA_Part_2x2( A,    &ATL, &ATR,
00046                       &ABL, &ABR,     0, 0, FLA_TL );
00047 
00048   while ( FLA_Obj_length( ATL ) < FLA_Obj_length( A ) ){  /* run until ATL is as long as A */
00049 
00050     b = FLA_Determine_blocksize( ABR, FLA_BR, FLA_Cntl_blocksize( cntl ) );
00051 
00052     FLA_Repart_2x2_to_3x3( ATL, /**/ ATR,       &A00, /**/ &A01, &A02,
00053                         /* ************* */   /* ******************** */
00054                                                 &A10, /**/ &A11, &A12,
00055                            ABL, /**/ ABR,       &A20, /**/ &A21, &A22,
00056                            b, b, FLA_BR );
00057 
00058     /*------------------------------------------------------------*/
00059 
00060     if ( FLA_Obj_is_real( A ) )  /* real case: plain transpose and Syrk */
00061     {
00062       /* A11 = chol( A11 ); */
00063       value = FLA_Chol_internal( FLA_UPPER_TRIANGULAR, A11,
00064                                  FLA_Cntl_sub_chol( cntl ) );
00065 
00066       if ( value != FLA_SUCCESS )  /* stop before touching A12 and A22; the sub-result is offset by the length of A00 */
00067         return ( FLA_Obj_length( A00 ) + value );
00068 
00069       /* A12 = inv( triu( A11 )' ) * A12; */
00070       FLA_Trsm_internal( FLA_LEFT, FLA_UPPER_TRIANGULAR,
00071                          FLA_TRANSPOSE, FLA_NONUNIT_DIAG,
00072                          FLA_ONE, A11, A12,
00073                          FLA_Cntl_sub_trsm( cntl ) );
00074 
00075       /* A22 = A22 - A12' * A12; */
00076       FLA_Syrk_internal( FLA_UPPER_TRIANGULAR, FLA_TRANSPOSE,
00077                          FLA_MINUS_ONE, A12, FLA_ONE, A22,
00078                          FLA_Cntl_sub_syrk( cntl ) );
00079     }
00080     else  /* non-real case: conjugate transpose and Herk */
00081     {
00082       /* A11 = chol( A11 ); */
00083       value = FLA_Chol_internal( FLA_UPPER_TRIANGULAR, A11,
00084                                  FLA_Cntl_sub_chol( cntl ) );
00085 
00086       if ( value != FLA_SUCCESS )  /* stop before touching A12 and A22; the sub-result is offset by the length of A00 */
00087         return ( FLA_Obj_length( A00 ) + value );
00088 
00089       /* A12 = inv( triu( A11 )' ) * A12; */
00090       FLA_Trsm_internal( FLA_LEFT, FLA_UPPER_TRIANGULAR,
00091                          FLA_CONJ_TRANSPOSE, FLA_NONUNIT_DIAG,
00092                          FLA_ONE, A11, A12,
00093                          FLA_Cntl_sub_trsm( cntl ) );
00094 
00095       /* A22 = A22 - A12' * A12; */
00096       FLA_Herk_internal( FLA_UPPER_TRIANGULAR, FLA_CONJ_TRANSPOSE,
00097                          FLA_MINUS_ONE, A12, FLA_ONE, A22,
00098                          FLA_Cntl_sub_herk( cntl ) );
00099     }
00100 
00101     /*------------------------------------------------------------*/
00102 
00103     FLA_Cont_with_3x3_to_2x2( &ATL, /**/ &ATR,       A00, A01, /**/ A02,
00104                                                      A10, A11, /**/ A12,
00105                             /* ************** */  /* ****************** */
00106                               &ABL, /**/ &ABR,       A20, A21, /**/ A22,
00107                               FLA_TL );
00108   }
00109 
00110   return value;
00111 }

FLA_Error FLA_Chol_u_unb_var1 ( FLA_Obj  A  ) 

References FLA_Cont_with_3x3_to_2x2(), FLA_Dotcs_external(), FLA_Dots_external(), FLA_MINUS_ONE, FLA_Obj_is_real(), FLA_Obj_length(), FLA_ONE, FLA_Part_2x2(), FLA_Repart_2x2_to_3x3(), FLA_Sqrt(), and FLA_Trsv_external().

00038 {  /* Unblocked variant 1: steps by 1; each pass solves for a01, updates alpha11, then takes its square root. */
00039   FLA_Obj ATL,   ATR,      A00,  a01,     A02,
00040           ABL,   ABR,      a10t, alpha11, a12t,
00041                            A20,  a21,     A22;
00042 
00043   int value = 0;  /* result of the last FLA_Sqrt() call; returned unchanged if the loop completes */
00044 
00045   FLA_Part_2x2( A,    &ATL, &ATR,
00046                       &ABL, &ABR,     0, 0, FLA_TL );
00047 
00048   while ( FLA_Obj_length( ATL ) < FLA_Obj_length( A ) ){  /* run until ATL is as long as A */
00049 
00050     FLA_Repart_2x2_to_3x3( ATL, /**/ ATR,       &A00,  /**/ &a01,     &A02,
00051                         /* ************* */   /* ************************** */
00052                                                 &a10t, /**/ &alpha11, &a12t,
00053                            ABL, /**/ ABR,       &A20,  /**/ &a21,     &A22,
00054                            1, 1, FLA_BR );
00055 
00056     /*------------------------------------------------------------*/
00057 
00058     if ( FLA_Obj_is_real( A ) )  /* real case: plain transpose and Dots */
00059     {
00060       /* a01 = inv( triu( A00 )' ) * a01; */
00061       FLA_Trsv_external( FLA_UPPER_TRIANGULAR, FLA_TRANSPOSE, FLA_NONUNIT_DIAG, A00, a01 );
00062 
00063       /* alpha11 = alpha11 - a01' * a01; */
00064       FLA_Dots_external( FLA_MINUS_ONE, a01, a01, FLA_ONE, alpha11 );
00065 
00066       /* alpha11 = sqrt( alpha11 ); */
00067       value = FLA_Sqrt( alpha11 );
00068 
00069       if ( value != FLA_SUCCESS )  /* stop early, reporting the length of A00 plus one */
00070         return ( FLA_Obj_length( A00 ) + 1 );
00071     }
00072     else  /* non-real case: conjugate transpose and Dotcs */
00073     {
00074       /* a01 = inv( triu( A00 )' ) * a01; */
00075       FLA_Trsv_external( FLA_UPPER_TRIANGULAR, FLA_CONJ_TRANSPOSE, FLA_NONUNIT_DIAG, A00, a01 );
00076 
00077       /* alpha11 = alpha11 - a01' * a01; */
00078       FLA_Dotcs_external( FLA_CONJUGATE, FLA_MINUS_ONE, a01, a01, FLA_ONE, alpha11 );
00079 
00080       /* alpha11 = sqrt( alpha11 ); */
00081       value = FLA_Sqrt( alpha11 );
00082 
00083       if ( value != FLA_SUCCESS )  /* stop early, reporting the length of A00 plus one */
00084         return ( FLA_Obj_length( A00 ) + 1 );
00085     }
00086 
00087     /*------------------------------------------------------------*/
00088 
00089     FLA_Cont_with_3x3_to_2x2( &ATL, /**/ &ATR,       A00,  a01,     /**/ A02,
00090                                                      a10t, alpha11, /**/ a12t,
00091                             /* ************** */  /* ************************ */
00092                               &ABL, /**/ &ABR,       A20,  a21,     /**/ A22,
00093                               FLA_TL );
00094   }
00095 
00096   return value;
00097 }

FLA_Error FLA_Chol_u_unb_var2 ( FLA_Obj  A  ) 

References FLA_Cont_with_3x3_to_2x2(), FLA_Dotcs_external(), FLA_Dots_external(), FLA_Gemv_external(), FLA_Gemvc_external(), FLA_Inv_scal_external(), FLA_MINUS_ONE, FLA_Obj_is_real(), FLA_Obj_length(), FLA_ONE, FLA_Part_2x2(), FLA_Repart_2x2_to_3x3(), and FLA_Sqrt().

00038 {  /* Unblocked variant 2: steps by 1; each pass updates alpha11 and a12t using a01, takes sqrt( alpha11 ), then scales a12t. */
00039   FLA_Obj ATL,   ATR,      A00,  a01,     A02,
00040           ABL,   ABR,      a10t, alpha11, a12t,
00041                            A20,  a21,     A22;
00042 
00043   int value = 0;  /* result of the last FLA_Sqrt() call; returned unchanged if the loop completes */
00044 
00045   FLA_Part_2x2( A,    &ATL, &ATR,
00046                       &ABL, &ABR,     0, 0, FLA_TL );
00047 
00048   while ( FLA_Obj_length( ATL ) < FLA_Obj_length( A ) ){  /* run until ATL is as long as A */
00049 
00050     FLA_Repart_2x2_to_3x3( ATL, /**/ ATR,       &A00,  /**/ &a01,     &A02,
00051                         /* ************* */   /* ************************** */
00052                                                 &a10t, /**/ &alpha11, &a12t,
00053                            ABL, /**/ ABR,       &A20,  /**/ &a21,     &A22,
00054                            1, 1, FLA_BR );
00055 
00056     /*------------------------------------------------------------*/
00057 
00058     if ( FLA_Obj_is_real( A ) )  /* real case: Dots and Gemv */
00059     {
00060       /* alpha11 = alpha11 - a01' * a01; */
00061       FLA_Dots_external( FLA_MINUS_ONE, a01, a01, FLA_ONE, alpha11 );
00062 
00063       /* a12t = a12t - a01' * A02; */
00064       /* a12t' = a12t' - A02' * a01; */
00065       FLA_Gemv_external( FLA_TRANSPOSE, FLA_MINUS_ONE, A02, a01, FLA_ONE, a12t );
00066 
00067       /* alpha11 = sqrt( alpha11 ); */
00068       value = FLA_Sqrt( alpha11 );
00069 
00070       if ( value != FLA_SUCCESS )  /* stop before scaling a12t, reporting the length of A00 plus one */
00071         return ( FLA_Obj_length( A00 ) + 1 );
00072 
00073       /* a12t = a12t / alpha11; */
00074       FLA_Inv_scal_external( alpha11, a12t );
00075     }
00076     else  /* non-real case: Dotcs and Gemvc with conjugation */
00077     {
00078       /* alpha11 = alpha11 - a01' * a01; */
00079       FLA_Dotcs_external( FLA_CONJUGATE, FLA_MINUS_ONE, a01, a01, FLA_ONE, alpha11 );
00080 
00081       /* a12t = a12t - a01' * A02; */
00082       /* a12t' = a12t' - A02' * conj(a01); */
00083       FLA_Gemvc_external( FLA_TRANSPOSE, FLA_CONJUGATE, FLA_MINUS_ONE, A02, a01, FLA_ONE, a12t );
00084 
00085       /* alpha11 = sqrt( alpha11 ); */
00086       value = FLA_Sqrt( alpha11 );
00087 
00088       if ( value != FLA_SUCCESS )  /* stop before scaling a12t, reporting the length of A00 plus one */
00089         return ( FLA_Obj_length( A00 ) + 1 );
00090 
00091       /* a12t = a12t / alpha11; */
00092       FLA_Inv_scal_external( alpha11, a12t );
00093     }
00094 
00095     /*------------------------------------------------------------*/
00096 
00097     FLA_Cont_with_3x3_to_2x2( &ATL, /**/ &ATR,       A00,  a01,     /**/ A02,
00098                                                      a10t, alpha11, /**/ a12t,
00099                             /* ************** */  /* ************************ */
00100                               &ABL, /**/ &ABR,       A20,  a21,     /**/ A22,
00101                               FLA_TL );
00102   }
00103 
00104   return value;
00105 }

FLA_Error FLA_Chol_u_unb_var3 ( FLA_Obj  A  ) 

References FLA_Cont_with_3x3_to_2x2(), FLA_Herc_external(), FLA_Inv_scal_external(), FLA_MINUS_ONE, FLA_Obj_is_real(), FLA_Obj_length(), FLA_Part_2x2(), FLA_Repart_2x2_to_3x3(), FLA_Sqrt(), and FLA_Syr_external().

00038 {  /* Unblocked variant 3: steps by 1; each pass takes sqrt( alpha11 ), scales a12t, then updates A22 with a12t. */
00039   FLA_Obj ATL,   ATR,      A00,  a01,     A02,
00040           ABL,   ABR,      a10t, alpha11, a12t,
00041                            A20,  a21,     A22;
00042 
00043   int value = 0;  /* result of the last FLA_Sqrt() call; returned unchanged if the loop completes */
00044 
00045   FLA_Part_2x2( A,    &ATL, &ATR,
00046                       &ABL, &ABR,     0, 0, FLA_TL );
00047 
00048   while ( FLA_Obj_length( ATL ) < FLA_Obj_length( A ) ){  /* run until ATL is as long as A */
00049 
00050     FLA_Repart_2x2_to_3x3( ATL, /**/ ATR,       &A00,  /**/ &a01,     &A02,
00051                         /* ************* */   /* ************************** */
00052                                                 &a10t, /**/ &alpha11, &a12t,
00053                            ABL, /**/ ABR,       &A20,  /**/ &a21,     &A22,
00054                            1, 1, FLA_BR );
00055 
00056     /*------------------------------------------------------------*/
00057 
00058     if ( FLA_Obj_is_real( A ) )  /* real case: Syr update */
00059     {
00060       /* alpha11 = sqrt( alpha11 ); */
00061       value = FLA_Sqrt( alpha11 );
00062   
00063       if ( value != FLA_SUCCESS )  /* stop before touching a12t and A22, reporting the length of A00 plus one */
00064         return ( FLA_Obj_length( A00 ) + 1 );
00065 
00066       /* a12t = a12t / alpha11; */
00067       FLA_Inv_scal_external( alpha11, a12t );
00068 
00069       /* A22 = A22 - a12t' * a12t; */
00070       FLA_Syr_external( FLA_UPPER_TRIANGULAR, FLA_MINUS_ONE, a12t, A22 );
00071     }
00072     else  /* non-real case: Herc update with conjugation */
00073     {
00074       /* alpha11 = sqrt( alpha11 ); */
00075       value = FLA_Sqrt( alpha11 );
00076   
00077       if ( value != FLA_SUCCESS )  /* stop before touching a12t and A22, reporting the length of A00 plus one */
00078         return ( FLA_Obj_length( A00 ) + 1 );
00079 
00080       /* a12t = a12t / alpha11; */
00081       FLA_Inv_scal_external( alpha11, a12t );
00082 
00083       /* A22 = A22 - a12t' * a12t; */
00084       FLA_Herc_external( FLA_UPPER_TRIANGULAR, FLA_CONJUGATE, FLA_MINUS_ONE, a12t, A22 );
00085     }
00086 
00087     /*------------------------------------------------------------*/
00088 
00089     FLA_Cont_with_3x3_to_2x2( &ATL, /**/ &ATR,       A00,  a01,     /**/ A02,
00090                                                      a10t, alpha11, /**/ a12t,
00091                             /* ************** */  /* ************************ */
00092                               &ABL, /**/ &ABR,       A20,  a21,     /**/ A22,
00093                               FLA_TL );
00094   }
00095 
00096   return value;
00097 }


Generated on Mon Jul 6 05:45:56 2009 for libflame by  doxygen 1.5.9