/* BLIS An object-based framework for developing high-performance BLAS-like libraries. Copyright (C) 2014, The University of Texas at Austin Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met: - Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer. - Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution. - Neither the name(s) of the copyright holder(s) nor the names of its contributors may be used to endorse or promote products derived from this software without specific prior written permission. THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. */ #include "blis.h" static const char* bli_ind_impl_str[BLIS_NUM_IND_METHODS] = { /* 1m */ "1m", /* nat */ "native", }; // ----------------------------------------------------------------------------- int bli_ind_init( void ) { // NOTE: If TLS is enabled, this function is called once by EACH application // thread per library init/finalize cycle (see bli_init.c). In this case, // the threads will initialize thread-local data (see bli_l3_ind.c). If TLS // is disabled, this function is called once by ONLY ONE application thread. // In neither case is a mutex needed to protect the data initialization. // NOTE: We intentionally call bli_gks_query_nat_cntx_noinit() in order // to avoid the internal call to bli_init_once(). const cntx_t* cntx = bli_gks_query_nat_cntx_noinit(); // For each precision, enable the default induced method (1m) if both of // the following conditions are met: // - the complex domain kernel is the (unoptimized) reference kernel // - the real domain kernel is NOT the (unoptimized) reference kernel // The second condition means that BLIS will not bother to use an induced // method if both the real and complex domain kernels are reference. bool s_is_ref = bli_gks_cntx_l3_nat_ukr_is_ref( BLIS_FLOAT, BLIS_GEMM_UKR, cntx ); bool d_is_ref = bli_gks_cntx_l3_nat_ukr_is_ref( BLIS_DOUBLE, BLIS_GEMM_UKR, cntx ); bool c_is_ref = bli_gks_cntx_l3_nat_ukr_is_ref( BLIS_SCOMPLEX, BLIS_GEMM_UKR, cntx ); bool z_is_ref = bli_gks_cntx_l3_nat_ukr_is_ref( BLIS_DCOMPLEX, BLIS_GEMM_UKR, cntx ); if ( c_is_ref && !s_is_ref ) bli_ind_enable_dt( BLIS_1M, BLIS_SCOMPLEX ); if ( z_is_ref && !d_is_ref ) bli_ind_enable_dt( BLIS_1M, BLIS_DCOMPLEX ); return 0; } int bli_ind_finalize( void ) { return 0; } // ----------------------------------------------------------------------------- void bli_ind_enable( ind_t method ) { bli_ind_enable_dt( method, BLIS_SCOMPLEX ); bli_ind_enable_dt( method, BLIS_DCOMPLEX ); } void bli_ind_disable( ind_t method ) { bli_ind_disable_dt( method, BLIS_SCOMPLEX ); bli_ind_disable_dt( method, BLIS_DCOMPLEX ); } void bli_ind_disable_all( void ) { bli_ind_disable_all_dt( BLIS_SCOMPLEX ); bli_ind_disable_all_dt( BLIS_DCOMPLEX ); } // ----------------------------------------------------------------------------- void bli_ind_enable_dt( ind_t method, num_t dt ) { if ( !bli_is_complex( dt ) ) return; bli_l3_ind_set_enable_dt( method, dt, TRUE ); } void bli_ind_disable_dt( ind_t method, num_t dt ) { if ( !bli_is_complex( dt ) ) return; bli_l3_ind_set_enable_dt( method, dt, FALSE ); } void bli_ind_disable_all_dt( num_t dt ) { ind_t im; for ( im = 0; im < BLIS_NUM_IND_METHODS; ++im ) { // Never disable native execution. if ( im != BLIS_NAT ) bli_ind_disable_dt( im, dt ); } } // ----------------------------------------------------------------------------- void bli_ind_oper_enable_only( opid_t oper, ind_t method, num_t dt ) { if ( !bli_is_complex( dt ) ) return; if ( bli_opid_is_level3( oper ) ) { bli_l3_ind_oper_enable_only( oper, method, dt ); } else { // Other operations are not implemented, so requests to enable // them for any given induced method are currently no-ops. ; } } // ----------------------------------------------------------------------------- bool bli_ind_oper_is_impl( opid_t oper, ind_t method ) { bool is_impl = FALSE; if ( bli_opid_is_level3( oper ) ) { // Look up whether the operation is implemented for the given induced // method id. is_impl = bli_l3_ind_oper_is_impl( oper, method ); } else { // All other operations should be reported as not implemented, // unless the requested check was for BLIS_NAT, in which case // all operations are implemented. if ( method == BLIS_NAT ) is_impl = TRUE; else is_impl = FALSE; } return is_impl; } ind_t bli_ind_oper_find_avail( opid_t oper, num_t dt ) { ind_t method; if ( bli_opid_is_level3( oper ) ) { method = bli_l3_ind_oper_find_avail( oper, dt ); } else { // Currently, any operation that is not level-3 is guaranteed // to be native. method = BLIS_NAT; } return method; } const char* bli_ind_oper_get_avail_impl_string( opid_t oper, num_t dt ) { ind_t method = bli_ind_oper_find_avail( oper, dt ); return bli_ind_get_impl_string( method ); } // ----------------------------------------------------------------------------- const char* bli_ind_get_impl_string( ind_t method ) { return bli_ind_impl_str[ method ]; } num_t bli_ind_map_cdt_to_index( num_t dt ) { // A non-complex datatype should never be passed in. if ( !bli_is_complex( dt ) ) bli_abort(); // Map the complex datatype to a zero-based index. if ( bli_is_scomplex( dt ) ) return 0; else /* if ( bli_is_dcomplex( dt ) ) */ return 1; }