| /* |
| * Copyright (C) 2008 The Android Open Source Project |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| /* ---- includes ----------------------------------------------------------- */ |
| |
| #include "b_TensorEm/Flt16Mat3D.h" |
| #include "b_TensorEm/Functions.h" |
| #include "b_BasicEm/Math.h" |
| |
| /* ------------------------------------------------------------------------- */ |
| |
| /* ========================================================================= */ |
| /* */ |
| /* ---- \ghd{ auxiliary functions } ---------------------------------------- */ |
| /* */ |
| /* ========================================================================= */ |
| |
| /* ------------------------------------------------------------------------- */ |
| |
| /* ========================================================================= */ |
| /* */ |
| /* ---- \ghd{ constructor / destructor } ----------------------------------- */ |
| /* */ |
| /* ========================================================================= */ |
| |
| /* ------------------------------------------------------------------------- */ |
| |
| void bts_Flt16Mat3D_init( struct bts_Flt16Mat3D* ptrA ) |
| { |
| ptrA->bbpE = 0; |
| ptrA->xxE = 0; |
| ptrA->xyE = 0; |
| ptrA->xzE = 0; |
| ptrA->yxE = 0; |
| ptrA->yyE = 0; |
| ptrA->yzE = 0; |
| ptrA->zxE = 0; |
| ptrA->zyE = 0; |
| ptrA->zzE = 0; |
| } |
| |
| /* ------------------------------------------------------------------------- */ |
| |
| void bts_Flt16Mat3D_exit( struct bts_Flt16Mat3D* ptrA ) |
| { |
| ptrA->bbpE = 0; |
| ptrA->xxE = 0; |
| ptrA->xyE = 0; |
| ptrA->xzE = 0; |
| ptrA->yxE = 0; |
| ptrA->yyE = 0; |
| ptrA->yzE = 0; |
| ptrA->zxE = 0; |
| ptrA->zyE = 0; |
| ptrA->zzE = 0; |
| } |
| |
| /* ------------------------------------------------------------------------- */ |
| |
| /* ========================================================================= */ |
| /* */ |
| /* ---- \ghd{ operators } -------------------------------------------------- */ |
| /* */ |
| /* ========================================================================= */ |
| |
| /* ------------------------------------------------------------------------- */ |
| |
| /* ========================================================================= */ |
| /* */ |
| /* ---- \ghd{ query functions } -------------------------------------------- */ |
| /* */ |
| /* ========================================================================= */ |
| |
| /* ------------------------------------------------------------------------- */ |
| |
| /* ========================================================================= */ |
| /* */ |
| /* ---- \ghd{ modify functions } ------------------------------------------- */ |
| /* */ |
| /* ========================================================================= */ |
| |
| /* ------------------------------------------------------------------------- */ |
| |
| /* ========================================================================= */ |
| /* */ |
| /* ---- \ghd{ I/O } -------------------------------------------------------- */ |
| /* */ |
| /* ========================================================================= */ |
| |
| /* ------------------------------------------------------------------------- */ |
| |
| uint32 bts_Flt16Mat3D_memSize( struct bbs_Context* cpA, |
| const struct bts_Flt16Mat3D *ptrA ) |
| { |
| return bbs_SIZEOF16( *ptrA ); |
| } |
| |
| /* ------------------------------------------------------------------------- */ |
| |
| uint32 bts_Flt16Mat3D_memWrite( struct bbs_Context* cpA, |
| const struct bts_Flt16Mat3D* ptrA, |
| uint16* memPtrA ) |
| { |
| bbs_ERROR0( "not implemented" ); |
| return 0; |
| } |
| |
| /* ------------------------------------------------------------------------- */ |
| |
| uint32 bts_Flt16Mat3D_memRead( struct bbs_Context* cpA, |
| struct bts_Flt16Mat3D* ptrA, |
| const uint16* memPtrA ) |
| { |
| if( bbs_Context_error( cpA ) ) return 0; |
| bbs_ERROR0( "not implemented" ); |
| return 0; |
| } |
| |
| /* ------------------------------------------------------------------------- */ |
| |
| /* ========================================================================= */ |
| /* */ |
| /* ---- \ghd{ exec functions } --------------------------------------------- */ |
| /* */ |
| /* ========================================================================= */ |
| |
| /* ------------------------------------------------------------------------- */ |
| |
| struct bts_Flt16Mat3D bts_Flt16Mat3D_createIdentity() |
| { |
| struct bts_Flt16Mat3D matL = { 1 << 14, 0, 0, 0, 1 << 14, 0, 0, 0, 1 << 14, 14 }; |
| return matL; |
| } |
| |
| /* ------------------------------------------------------------------------- */ |
| |
| struct bts_Flt16Mat3D bts_Flt16Mat3D_createScale( int32 scaleA, int32 scaleBbpA ) |
| { |
| struct bts_Flt16Mat3D matL = bts_Flt16Mat3D_createIdentity(); |
| bts_Flt16Mat3D_scale( &matL, scaleA, scaleBbpA ); |
| return matL; |
| } |
| |
| /* ------------------------------------------------------------------------- */ |
| |
| struct bts_Flt16Mat3D bts_Flt16Mat3D_create16( int16 xxA, int16 xyA, int16 xzA, |
| int16 yxA, int16 yyA, int16 yzA, |
| int16 zxA, int16 zyA, int16 zzA, |
| int16 bbpA ) |
| { |
| struct bts_Flt16Mat3D matL; |
| matL.xxE = xxA; |
| matL.xyE = xyA; |
| matL.xzE = xzA; |
| matL.yxE = yxA; |
| matL.yyE = yyA; |
| matL.yzE = yzA; |
| matL.zxE = zxA; |
| matL.zyE = zyA; |
| matL.zzE = zzA; |
| matL.bbpE = bbpA; |
| return matL; |
| } |
| |
| /* ------------------------------------------------------------------------- */ |
| |
| struct bts_Flt16Mat3D bts_Flt16Mat3D_create32( int32 xxA, int32 xyA, int32 xzA, |
| int32 yxA, int32 yyA, int32 yzA, |
| int32 zxA, int32 zyA, int32 zzA, |
| int32 bbpA ) |
| { |
| struct bts_Flt16Mat3D matL; |
| |
| if( ( xxA | xyA | xzA | yxA | yyA | yzA | zxA | zyA | zzA ) == 0 ) |
| { |
| matL.xxE = 0; |
| matL.xyE = 0; |
| matL.xzE = 0; |
| matL.yxE = 0; |
| matL.yyE = 0; |
| matL.yzE = 0; |
| matL.zxE = 0; |
| matL.zyE = 0; |
| matL.zzE = 0; |
| matL.bbpE = 0; |
| } |
| else |
| { |
| int32 xShiftL = bts_maxAbsIntLog2Of3( xxA, xyA, xzA ) - 13; |
| int32 yShiftL = bts_maxAbsIntLog2Of3( yxA, yyA, yzA ) - 13; |
| int32 zShiftL = bts_maxAbsIntLog2Of3( zxA, zyA, zzA ) - 13; |
| |
| int32 shiftL = bbs_max( bbs_max( xShiftL, yShiftL ), zShiftL ); |
| |
| if( shiftL > 0 ) |
| { |
| int32 sh1L = shiftL - 1; |
| matL.xxE = ( ( xxA >> sh1L ) + 1 ) >> 1; |
| matL.xyE = ( ( xyA >> sh1L ) + 1 ) >> 1; |
| matL.xzE = ( ( xzA >> sh1L ) + 1 ) >> 1; |
| matL.yxE = ( ( yxA >> sh1L ) + 1 ) >> 1; |
| matL.yyE = ( ( yyA >> sh1L ) + 1 ) >> 1; |
| matL.yzE = ( ( yzA >> sh1L ) + 1 ) >> 1; |
| matL.zxE = ( ( zxA >> sh1L ) + 1 ) >> 1; |
| matL.zyE = ( ( zyA >> sh1L ) + 1 ) >> 1; |
| matL.zzE = ( ( zzA >> sh1L ) + 1 ) >> 1; |
| } |
| else |
| { |
| matL.xxE = xxA << -shiftL; |
| matL.xyE = xyA << -shiftL; |
| matL.xzE = xzA << -shiftL; |
| matL.yxE = yxA << -shiftL; |
| matL.yyE = yyA << -shiftL; |
| matL.yzE = yzA << -shiftL; |
| matL.zxE = zxA << -shiftL; |
| matL.zyE = zyA << -shiftL; |
| matL.zzE = zzA << -shiftL; |
| } |
| |
| matL.bbpE = bbpA - shiftL; |
| } |
| return matL; |
| } |
| |
| /* ------------------------------------------------------------------------- */ |
| |
| void bts_Flt16Mat3D_scale( struct bts_Flt16Mat3D* ptrA, int32 scaleA, int32 scaleBbpA ) |
| { |
| /* fit scale in 15 bit */ |
| uint32 scaleExpL = bts_absIntLog2( scaleA ); |
| if( scaleExpL > 14 ) |
| { |
| int32 shiftL = scaleExpL - 14; |
| scaleA = ( ( scaleA >> ( shiftL - 1 ) ) + 1 ) >> 1; |
| scaleBbpA -= shiftL; |
| } |
| |
| *ptrA = bts_Flt16Mat3D_create32( ptrA->xxE * scaleA, ptrA->xyE * scaleA, ptrA->xzE * scaleA, |
| ptrA->yxE * scaleA, ptrA->yyE * scaleA, ptrA->yzE * scaleA, |
| ptrA->zxE * scaleA, ptrA->zyE * scaleA, ptrA->zzE * scaleA, |
| ptrA->bbpE + scaleBbpA ); |
| } |
| |
| /* ------------------------------------------------------------------------- */ |
| #ifndef HW_EE /* causes internal compiler error in ee-gcc */ |
| struct bts_Int16Vec3D bts_Flt16Mat3D_map( const struct bts_Flt16Mat3D* matPtrA, |
| const struct bts_Int16Vec3D* vecPtrA ) |
| { |
| struct bts_Int16Vec3D vecL; |
| |
| int32 xL = ( int32 ) matPtrA->xxE * vecPtrA->xE + ( int32 ) matPtrA->xyE * vecPtrA->yE + ( int32 ) matPtrA->xzE * vecPtrA->zE; |
| int32 yL = ( int32 ) matPtrA->yxE * vecPtrA->xE + ( int32 ) matPtrA->yyE * vecPtrA->yE + ( int32 ) matPtrA->yzE * vecPtrA->zE; |
| int32 zL = ( int32 ) matPtrA->zxE * vecPtrA->xE + ( int32 ) matPtrA->zyE * vecPtrA->yE + ( int32 ) matPtrA->zzE * vecPtrA->zE; |
| |
| if( matPtrA->bbpE > 0 ) |
| { |
| int32 sh1L = matPtrA->bbpE - 1; |
| vecL.xE = ( ( xL >> sh1L ) + 1 ) >> 1; |
| vecL.yE = ( ( yL >> sh1L ) + 1 ) >> 1; |
| vecL.zE = ( ( zL >> sh1L ) + 1 ) >> 1; |
| } |
| else |
| { |
| /* not overflow safe */ |
| vecL.xE = xL << -matPtrA->bbpE; |
| vecL.yE = yL << -matPtrA->bbpE; |
| vecL.zE = zL << -matPtrA->bbpE; |
| } |
| |
| return vecL; |
| } |
| #endif |
| /* ------------------------------------------------------------------------- */ |
| |
| struct bts_Flt16Vec3D bts_Flt16Mat3D_mapFlt( const struct bts_Flt16Mat3D* matPtrA, |
| const struct bts_Flt16Vec3D* vecPtrA ) |
| { |
| /* avoids overflow summing intermediate products */ |
| int32 xL = ( ( ( ( int32 ) matPtrA->xxE * vecPtrA->xE + 1 ) >> 1 ) + |
| ( ( ( int32 ) matPtrA->xyE * vecPtrA->yE + 1 ) >> 1 ) + |
| ( ( ( int32 ) matPtrA->xzE * vecPtrA->zE + 1 ) >> 1 ) ); |
| |
| int32 yL = ( ( ( ( int32 ) matPtrA->yxE * vecPtrA->xE + 1 ) >> 1 ) + |
| ( ( ( int32 ) matPtrA->yyE * vecPtrA->yE + 1 ) >> 1 ) + |
| ( ( ( int32 ) matPtrA->yzE * vecPtrA->zE + 1 ) >> 1 ) ); |
| |
| int32 zL = ( ( ( ( int32 ) matPtrA->zxE * vecPtrA->xE + 1 ) >> 1 ) + |
| ( ( ( int32 ) matPtrA->zyE * vecPtrA->yE + 1 ) >> 1 ) + |
| ( ( ( int32 ) matPtrA->zzE * vecPtrA->zE + 1 ) >> 1 ) ); |
| |
| |
| return bts_Flt16Vec3D_create32( xL, yL, zL, vecPtrA->bbpE + matPtrA->bbpE - 1 ); |
| } |
| |
| /* ------------------------------------------------------------------------- */ |
| |
| struct bts_Flt16Mat3D bts_Flt16Mat3D_mul( const struct bts_Flt16Mat3D* mat1PtrA, |
| const struct bts_Flt16Mat3D* mat2PtrA ) |
| { |
| /* avoids overflow summing intermediate products */ |
| return bts_Flt16Mat3D_create32( |
| |
| ( ( ( int32 ) mat1PtrA->xxE * mat2PtrA->xxE + 1 ) >> 1 ) + ( ( ( int32 ) mat1PtrA->xyE * mat2PtrA->yxE + 1 ) >> 1 ) + ( ( ( int32 ) mat1PtrA->xzE * mat2PtrA->zxE + 1 ) >> 1 ), |
| ( ( ( int32 ) mat1PtrA->xxE * mat2PtrA->xyE + 1 ) >> 1 ) + ( ( ( int32 ) mat1PtrA->xyE * mat2PtrA->yyE + 1 ) >> 1 ) + ( ( ( int32 ) mat1PtrA->xzE * mat2PtrA->zyE + 1 ) >> 1 ), |
| ( ( ( int32 ) mat1PtrA->xxE * mat2PtrA->xzE + 1 ) >> 1 ) + ( ( ( int32 ) mat1PtrA->xyE * mat2PtrA->yzE + 1 ) >> 1 ) + ( ( ( int32 ) mat1PtrA->xzE * mat2PtrA->zzE + 1 ) >> 1 ), |
| |
| ( ( ( int32 ) mat1PtrA->yxE * mat2PtrA->xxE + 1 ) >> 1 ) + ( ( ( int32 ) mat1PtrA->yyE * mat2PtrA->yxE + 1 ) >> 1 ) + ( ( ( int32 ) mat1PtrA->yzE * mat2PtrA->zxE + 1 ) >> 1 ), |
| ( ( ( int32 ) mat1PtrA->yxE * mat2PtrA->xyE + 1 ) >> 1 ) + ( ( ( int32 ) mat1PtrA->yyE * mat2PtrA->yyE + 1 ) >> 1 ) + ( ( ( int32 ) mat1PtrA->yzE * mat2PtrA->zyE + 1 ) >> 1 ), |
| ( ( ( int32 ) mat1PtrA->yxE * mat2PtrA->xzE + 1 ) >> 1 ) + ( ( ( int32 ) mat1PtrA->yyE * mat2PtrA->yzE + 1 ) >> 1 ) + ( ( ( int32 ) mat1PtrA->yzE * mat2PtrA->zzE + 1 ) >> 1 ), |
| |
| ( ( ( int32 ) mat1PtrA->zxE * mat2PtrA->xxE + 1 ) >> 1 ) + ( ( ( int32 ) mat1PtrA->zyE * mat2PtrA->yxE + 1 ) >> 1 ) + ( ( ( int32 ) mat1PtrA->zzE * mat2PtrA->zxE + 1 ) >> 1 ), |
| ( ( ( int32 ) mat1PtrA->zxE * mat2PtrA->xyE + 1 ) >> 1 ) + ( ( ( int32 ) mat1PtrA->zyE * mat2PtrA->yyE + 1 ) >> 1 ) + ( ( ( int32 ) mat1PtrA->zzE * mat2PtrA->zyE + 1 ) >> 1 ), |
| ( ( ( int32 ) mat1PtrA->zxE * mat2PtrA->xzE + 1 ) >> 1 ) + ( ( ( int32 ) mat1PtrA->zyE * mat2PtrA->yzE + 1 ) >> 1 ) + ( ( ( int32 ) mat1PtrA->zzE * mat2PtrA->zzE + 1 ) >> 1 ), |
| |
| mat1PtrA->bbpE + mat2PtrA->bbpE - 1 ); |
| } |
| |
| /* ------------------------------------------------------------------------- */ |
| |
| struct bts_Flt16Mat3D* bts_Flt16Mat3D_mulTo( struct bts_Flt16Mat3D* mat1PtrA, |
| const struct bts_Flt16Mat3D* mat2PtrA ) |
| { |
| *mat1PtrA = bts_Flt16Mat3D_mul( mat1PtrA, mat2PtrA ); |
| return mat1PtrA; |
| } |
| |
| /* ------------------------------------------------------------------------- */ |
| |
| /* ========================================================================= */ |
| |