[wxWidgets.git] / src / freetype / base / ftcalc.c

/***************************************************************************/
/*                                                                         */
/*  ftcalc.c                                                               */
/*                                                                         */
/*    Arithmetic computations (body).                                      */
/*                                                                         */
/*  Copyright 1996-2000 by                                                 */
/*  David Turner, Robert Wilhelm, and Werner Lemberg.                      */
/*                                                                         */
/*  This file is part of the FreeType project, and may only be used,       */
/*  modified, and distributed under the terms of the FreeType project      */
/*  license, LICENSE.TXT.  By continuing to use, modify, or distribute     */
/*  this file you indicate that you have read the license and              */
/*  understand and accept it fully.                                        */
/*                                                                         */
/***************************************************************************/

  /*************************************************************************/
  /*                                                                       */
  /* Support for 1-complement arithmetic has been totally dropped in this  */
  /* release.  You can still write your own code if you need it.           */
  /*                                                                       */
  /*************************************************************************/

  /*************************************************************************/
  /*                                                                       */
  /* Implementing basic computation routines.                              */
  /*                                                                       */
  /* FT_MulDiv(), FT_MulFix(), and FT_DivFix() are declared in freetype.h. */
  /*                                                                       */
  /*************************************************************************/


#include <freetype/internal/ftcalc.h>
#include <freetype/internal/ftdebug.h>
#include <freetype/internal/ftobjs.h>  /* for ABS() */


  /*************************************************************************/
  /*                                                                       */
  /* The macro FT_COMPONENT is used in trace mode.  It is an implicit      */
  /* parameter of the FT_TRACE() and FT_ERROR() macros, used to print/log  */
  /* messages during execution.                                            */
  /*                                                                       */
#undef  FT_COMPONENT
#define FT_COMPONENT  trace_calc


#ifdef FT_CONFIG_OPTION_OLD_CALCS

  /* Starting values for the Newton iteration in FT_Sqrt64().  Entry `i' */
  /* approximates sqrt(2^i); it is selected with the index of the        */
  /* highest set bit of the operand, as returned by ft_order64().        */
  static const FT_Long  ft_square_roots[63] =
  {
       1L,    1L,    2L,     3L,     4L,     5L,     8L,    11L,
      16L,   22L,   32L,    45L,    64L,    90L,   128L,   181L,
     256L,  362L,  512L,   724L,  1024L,  1448L,  2048L,  2896L,
    4096L, 5792L, 8192L, 11585L, 16384L, 23170L, 32768L, 46340L,

      65536L,   92681L,  131072L,   185363L,   262144L,   370727L,
     524288L,  741455L, 1048576L,  1482910L,  2097152L,  2965820L,
    4194304L, 5931641L, 8388608L, 11863283L, 16777216L, 23726566L,

      33554432L,   47453132L,   67108864L,   94906265L,
     134217728L,  189812531L,  268435456L,  379625062L,
     536870912L,  759250125L, 1073741824L, 1518500250L,
    2147483647L
  };

#else

  /*************************************************************************/
  /*                                                                       */
  /* <Function>                                                            */
  /*    FT_Sqrt32                                                          */
  /*                                                                       */
  /* <Description>                                                         */
  /*    Computes the square root of an Int32 integer (which will be        */
  /*    handled as an unsigned long value).                                */
  /*                                                                       */
  /* <Input>                                                               */
  /*    x :: The value to compute the root for.                            */
  /*                                                                       */
  /* <Return>                                                              */
  /*    The result of `sqrt(x)'.                                           */
  /*                                                                       */
  FT_EXPORT_FUNC( FT_Int32 )  FT_Sqrt32( FT_Int32  x )
  {
    FT_ULong  remainder = (FT_ULong)x;
    FT_ULong  result    = 0;
    FT_ULong  bit;


    /* visit the even bit positions, from bit 30 down to bit 0 */
    for ( bit = 0x40000000L; bit != 0; bit >>= 2 )
    {
      FT_ULong  trial = result + bit;


      /* keep the candidate bit if it still fits into what is left */
      if ( trial <= remainder )
      {
        remainder -= trial;
        result     = trial + bit;
      }

      result >>= 1;
    }

    return result;
  }

#endif /* FT_CONFIG_OPTION_OLD_CALCS */


#ifdef FT_LONG64

  /*************************************************************************/
  /*                                                                       */
  /* <Function>                                                            */
  /*    FT_MulDiv                                                          */
  /*                                                                       */
  /* <Description>                                                         */
  /*    A very simple function used to perform the computation `(a*b)/c'   */
  /*    with maximal accuracy (it uses a 64-bit intermediate integer       */
  /*    whenever necessary).                                               */
  /*                                                                       */
  /*    This function isn't necessarily as fast as some processor specific */
  /*    operations, but is at least completely portable.                   */
  /*                                                                       */
  /* <Input>                                                               */
  /*    a :: The first multiplier.                                         */
  /*    b :: The second multiplier.                                        */
  /*    c :: The divisor.                                                  */
  /*                                                                       */
  /* <Return>                                                              */
  /*    The result of `(a*b)/c'.  This function never traps when trying to */
  /*    divide by zero; it simply returns `MaxInt' or `MinInt' depending   */
  /*    on the signs of `a' and `b'.                                       */
  /*                                                                       */
  FT_EXPORT_FUNC( FT_Long )  FT_MulDiv( FT_Long  a,
                                        FT_Long  b,
                                        FT_Long  c )
  {
    FT_Int  sign = 1;


    /* reduce to non-negative operands and remember the result's sign */
    if ( a < 0 )
    {
      a    = -a;
      sign = -sign;
    }

    if ( b < 0 )
    {
      b    = -b;
      sign = -sign;
    }

    if ( c < 0 )
    {
      c    = -c;
      sign = -sign;
    }

    /* no usable divisor: saturate instead of dividing */
    if ( !( c > 0 ) )
      return sign * 0x7FFFFFFFL;

    /* 64-bit product, rounded to nearest by adding half the divisor */
    return sign * ( ( (FT_Int64)a * b + ( c >> 1 ) ) / c );
  }


  /*************************************************************************/
  /*                                                                       */
  /* <Function>                                                            */
  /*    FT_MulFix                                                          */
  /*                                                                       */
  /* <Description>                                                         */
  /*    A very simple function used to perform the computation             */
  /*    `(a*b)/0x10000' with maximal accuracy.  Most of the time this is   */
  /*    used to multiply a given value by a 16.16 fixed float factor.      */
  /*                                                                       */
  /* <Input>                                                               */
  /*    a :: The first multiplier.                                         */
  /*    b :: The second multiplier.  Use a 16.16 factor here whenever      */
  /*         possible (see note below).                                    */
  /*                                                                       */
  /* <Return>                                                              */
  /*    The result of `(a*b)/0x10000'.                                     */
  /*                                                                       */
  /* <Note>                                                                */
  /*    This function has been optimized for the case where the absolute   */
  /*    value of `a' is less than 2048, and `b' is a 16.16 scaling factor. */
  /*    As this happens mainly when scaling from notional units to         */
  /*    fractional pixels in FreeType, it resulted in noticeable speed     */
  /*    improvements between versions 2.x and 1.x.                         */
  /*                                                                       */
  /*    As a conclusion, always try to place a 16.16 factor as the         */
  /*    _second_ argument of this function; this can make a great          */
  /*    difference.                                                        */
  /*                                                                       */
  FT_EXPORT_FUNC( FT_Long )  FT_MulFix( FT_Long  a,
                                        FT_Long  b )
  {
    FT_Int    sign = 1;
    FT_Int64  product;


    /* multiply the magnitudes; the sign is re-applied at the end */
    if ( a < 0 )
    {
      a    = -a;
      sign = -sign;
    }

    if ( b < 0 )
    {
      b    = -b;
      sign = -sign;
    }

    /* adding 0x8000 rounds to nearest before the 16 low bits are dropped */
    product = (FT_Int64)a * b + 0x8000;

    return sign * (FT_Long)( product >> 16 );
  }


  /*************************************************************************/
  /*                                                                       */
  /* <Function>                                                            */
  /*    FT_DivFix                                                          */
  /*                                                                       */
  /* <Description>                                                         */
  /*    A very simple function used to perform the computation             */
  /*    `(a*0x10000)/b' with maximal accuracy.  Most of the time, this is  */
  /*    used to divide a given value by a 16.16 fixed float factor.        */
  /*                                                                       */
  /* <Input>                                                               */
  /*    a :: The dividend (numerator).                                     */
  /*    b :: The divisor (denominator).  Use a 16.16 factor here whenever  */
  /*         possible (see note below).                                    */
  /*                                                                       */
  /* <Return>                                                              */
  /*    The result of `(a*0x10000)/b'.                                     */
  /*                                                                       */
  /* <Note>                                                                */
  /*    This variant relies on a native 64-bit integer type: `a' is        */
  /*    widened to 64 bits, shifted left by 16, and divided by `b'         */
  /*    directly, so no 32-bit special-casing is needed.                   */
  /*                                                                       */
  FT_EXPORT_FUNC( FT_Long )  FT_DivFix( FT_Long  a,
                                        FT_Long  b )
  {
    FT_Int32   sign;
    FT_UInt32  quotient;


    /* XOR of both operands: negative when their signs differ */
    sign  = a;
    sign ^= b;

    a = ABS(a);
    b = ABS(b);

    /* saturate on division by zero, otherwise divide with 64-bit range */
    quotient = 0x7FFFFFFFL;
    if ( b != 0 )
      quotient = ( (FT_Int64)a << 16 ) / b;

    if ( sign < 0 )
      return (FT_Int32)( -quotient );

    return (FT_Int32)( quotient );
  }


#ifdef FT_CONFIG_OPTION_OLD_CALCS

  /* a helper function for FT_Sqrt64() */

  static
  int  ft_order64( FT_Int64  z )
  {
    unsigned FT_INT64  bits  = (unsigned FT_INT64)z;
    int                order = -1;


    /* count the shifts needed to clear every set bit; the result is */
    /* the index of the highest set bit, or -1 for a zero argument   */
    while ( bits )
    {
      bits >>= 1;
      order++;
    }

    return order;
  }


  /*************************************************************************/
  /*                                                                       */
  /* <Function>                                                            */
  /*    FT_Sqrt64                                                          */
  /*                                                                       */
  /* <Description>                                                         */
  /*    Computes the square root of a 64-bit value.  That sounds stupid,   */
  /*    but it is needed to obtain maximal accuracy in the TrueType        */
  /*    bytecode interpreter.                                              */
  /*                                                                       */
  /* <Input>                                                               */
  /*    l :: A 64-bit integer.                                             */
  /*                                                                       */
  /* <Return>                                                              */
  /*    The 32-bit square-root.                                            */
  /*                                                                       */
  FT_EXPORT_FUNC( FT_Int32 )  FT_Sqrt64( FT_Int64  l )
  {
    FT_Int64  guess, previous;


    if ( l <= 0 )
      return 0;

    if ( l == 1 )
      return 1;

    /* seed the iteration from the table, indexed by the top set bit */
    guess = ft_square_roots[ft_order64( l )];

    for (;;)
    {
      previous = guess;
      guess    = ( guess + l / guess ) >> 1;

      /* stop once the estimate no longer grows and its square fits */
      if ( guess <= previous && guess * guess <= l )
        break;
    }

    return guess;
  }

#endif /* FT_CONFIG_OPTION_OLD_CALCS */


#else /* FT_LONG64 */


  /*************************************************************************/
  /*                                                                       */
  /* <Function>                                                            */
  /*    FT_MulDiv                                                          */
  /*                                                                       */
  /* <Description>                                                         */
  /*    A very simple function used to perform the computation `(a*b)/c'   */
  /*    with maximal accuracy (it uses a 64-bit intermediate integer       */
  /*    whenever necessary).                                               */
  /*                                                                       */
  /*    This function isn't necessarily as fast as some processor specific */
  /*    operations, but is at least completely portable.                   */
  /*                                                                       */
  /* <Input>                                                               */
  /*    a :: The first multiplier.                                         */
  /*    b :: The second multiplier.                                        */
  /*    c :: The divisor.                                                  */
  /*                                                                       */
  /* <Return>                                                              */
  /*    The result of `(a*b)/c'.  This function never traps when trying to */
  /*    divide by zero; it simply returns `MaxInt' or `MinInt' depending   */
  /*    on the signs of `a' and `b'.                                       */
  /*                                                                       */
  /* <Note>                                                                */
  /*    The FT_MulDiv() function has been optimized thanks to ideas from   */
  /*    Graham Asher.  The trick is to optimize computation if everything  */
  /*    fits within 32 bits (a rather common case).                        */
  /*                                                                       */
  /*    We compute `a*b+c/2', then divide it by `c' (positive values).     */
  /*                                                                       */
  /*      46340 is FLOOR(SQRT(2^31-1)).                                    */
  /*                                                                       */
  /*      if ( a <= 46340 && b <= 46340 ) then ( a*b <= 0x7FFEA810 )       */
  /*                                                                       */
  /*      0x7FFFFFFF - 0x7FFEA810 = 0x157F0                                */
  /*                                                                       */
  /*      if ( c < 0x157F0*2 ) then ( a*b+c/2 <= 0x7FFFFFFF )              */
  /*                                                                       */
  /*      and 2*0x157F0 = 176096.                                          */
  /*                                                                       */
  FT_EXPORT_FUNC( FT_Long )  FT_MulDiv( FT_Long  a,
                                        FT_Long  b,
                                        FT_Long  c )
  {
    long  sign;


    /* nothing to scale, or multiplier and divisor cancel out */
    if ( a == 0 || b == c )
      return a;

    /* XOR of all three operands: negative when the result must be */
    sign = a ^ b ^ c;

    a = ABS( a );
    b = ABS( b );
    c = ABS( c );

    if ( !( c > 0 ) )
    {
      /* no usable divisor: saturate */
      a = 0x7FFFFFFFL;
    }
    else if ( a <= 46340 && b <= 46340 && c <= 176095L )
    {
      /* `a*b + c/2' is known to fit in 32 bits here */
      a = ( a * b + ( c >> 1 ) ) / c;
    }
    else
    {
      FT_Int64  product, half;


      /* emulated 64-bit path: product plus half the divisor, then divide */
      FT_MulTo64( a, b, &product );

      half.hi = (FT_Int32)( c >> 31 );
      half.lo = (FT_UInt32)( c / 2 );

      FT_Add64( &product, &half, &product );
      a = FT_Div64by32( &product, c );
    }

    return ( sign < 0 ? -a : a );
  }


  /*************************************************************************/
  /*                                                                       */
  /* <Function>                                                            */
  /*    FT_MulFix                                                          */
  /*                                                                       */
  /* <Description>                                                         */
  /*    A very simple function used to perform the computation             */
  /*    `(a*b)/0x10000' with maximal accuracy.  Most of the time, this is  */
  /*    used to multiply a given value by a 16.16 fixed float factor.      */
  /*                                                                       */
  /* <Input>                                                               */
  /*    a :: The first multiplier.                                         */
  /*    b :: The second multiplier.  Use a 16.16 factor here whenever      */
  /*         possible (see note below).                                    */
  /*                                                                       */
  /* <Return>                                                              */
  /*    The result of `(a*b)/0x10000'.                                     */
  /*                                                                       */
  /* <Note>                                                                */
  /*    The optimization for FT_MulFix() is different.  We could simply be */
  /*    happy by applying the same principles as with FT_MulDiv(), because */
  /*                                                                       */
  /*      c = 0x10000 < 176096                                             */
  /*                                                                       */
  /*    However, in most cases, we have a `b' with a value around 0x10000  */
  /*    which is greater than 46340.                                       */
  /*                                                                       */
  /*    According to some testing, most cases have `a' < 2048, so a good   */
  /*    idea is to use bounds like 2048 and 1048576 (= 2^31 / 2048) for    */
  /*    `a' and `b', respectively.                                         */
  /*                                                                       */
  FT_EXPORT_FUNC( FT_Long )  FT_MulFix( FT_Long  a,
                                        FT_Long  b )
  {
    FT_Long   s;
    FT_ULong  ua, ub;


    /* a zero operand, or a factor of exactly 1.0 (0x10000), leaves */
    /* `a' unchanged                                                */
    if ( a == 0 || b == 0x10000L )
      return a;

    /* `s' is negative when the operands have different signs */
    s  = a; a = ABS(a);
    s ^= b; b = ABS(b);

    ua = (FT_ULong)a;
    ub = (FT_ULong)b;

    if ( ua <= 2048 && ub <= 1048576L )
    {
      /* the rounded product fits in 32 bits: compute it directly */
      ua = ( ua * ub + 0x8000 ) >> 16;
    }
    else
    {
      FT_ULong  al = ua & 0xFFFF;


      /* Split `ua' into 16-bit halves and sum the partial products.  */
      /* Only the lowest one carries fractional bits, so it gets the  */
      /* same `+ 0x8000' rounding as the fast path; at most           */
      /* 0xFFFF * 0xFFFF + 0x8000, this still fits in 32 bits.        */
      ua = ( ua >> 16 ) * ub +
           al * ( ub >> 16 ) +
           ( ( al * ( ub & 0xFFFF ) + 0x8000 ) >> 16 );
    }

    return ( s < 0 ? -(FT_Long)ua : (FT_Long)ua );
  }


  /*************************************************************************/
  /*                                                                       */
  /* <Function>                                                            */
  /*    FT_DivFix                                                          */
  /*                                                                       */
  /* <Description>                                                         */
  /*    A very simple function used to perform the computation             */
  /*    `(a*0x10000)/b' with maximal accuracy.  Most of the time, this is  */
  /*    used to divide a given value by a 16.16 fixed float factor.        */
  /*                                                                       */
  /* <Input>                                                               */
  /*    a :: The dividend (numerator).                                     */
  /*    b :: The divisor (denominator).  Use a 16.16 factor here whenever  */
  /*         possible (see note below).                                    */
  /*                                                                       */
  /* <Return>                                                              */
  /*    The result of `(a*0x10000)/b'.                                     */
  /*                                                                       */
  /* <Note>                                                                */
  /*    The optimization for FT_DivFix() is simple: If (a << 16) fits into */
  /*    32 bits, then the division is computed directly.  Otherwise, we    */
  /*    use a specialized version of the old FT_MulDiv64().                */
  /*                                                                       */
  FT_EXPORT_FUNC( FT_Long )  FT_DivFix( FT_Long  a,
                                        FT_Long  b )
  {
    FT_Int32   s;
    FT_UInt32  q;


    /* `s' collects the XOR of both operands, so it is negative when */
    /* their signs differ; from here on `a' and `b' are magnitudes   */
    s  = a; a = ABS(a);
    s ^= b; b = ABS(b);

    if ( b == 0 )
    {
      /* division by zero: saturate instead of trapping */
      q = 0x7FFFFFFFL;
    }
    else if ( ( a >> 16 ) == 0 )
    {
      /* `a' has no bits above bit 15, so `a << 16' still fits in 32 */
      /* bits and can be divided directly                            */
      q = (FT_UInt32)( a << 16 ) / (FT_UInt32)b;
    }
    else
    {
      /* we need more bits; we have to do it by hand */
      FT_UInt32  c;


      /* integer part of the quotient, moved into the upper 16 bits; */
      /* `c' is the remainder that still has to be divided           */
      q  = ( a / b ) << 16;
      c  = a % b;

      /* we must compute C*0x10000/B: we simply shift C and B so   */
      /* C becomes smaller than 16 bits.  Every step drops the low */
      /* bit of C, so the fractional part is only approximate.     */
      /* NOTE(review): `b <<= 1' is not checked for overflow --    */
      /* confirm the range of `b' that callers can pass.           */
      while ( c >> 16 )
      {
        c >>= 1;
        b <<= 1;
      }

      /* add the (approximate) fractional part */
      q += ( c << 16 ) / b;
    }

    /* re-apply the sign recorded in `s' */
    return ( s < 0 ? -(FT_Int32)q : (FT_Int32)q );
  }


  /*************************************************************************/
  /*                                                                       */
  /* <Function>                                                            */
  /*    FT_Add64                                                           */
  /*                                                                       */
  /* <Description>                                                         */
  /*    Add two Int64 values.                                              */
  /*                                                                       */
  /* <Input>                                                               */
  /*    x :: A pointer to the first value to be added.                     */
  /*    y :: A pointer to the second value to be added.                    */
  /*                                                                       */
  /* <Output>                                                              */
  /*    z :: A pointer to the result of `x + y'.                           */
  /*                                                                       */
  /* <Note>                                                                */
  /*    Will be wrapped by the ADD_64() macro.                             */
  /*                                                                       */
  FT_EXPORT_FUNC( void )  FT_Add64( FT_Int64*  x,
                                    FT_Int64*  y,
                                    FT_Int64*  z )
  {
    /* everything is computed before `z' is written, so `z' may be */
    /* the same object as `x' or `y'                               */
    FT_UInt32  low_sum  = x->lo + y->lo;
    int        carry    = ( low_sum < x->lo );
    FT_UInt32  high_sum = x->hi + y->hi + carry;


    z->lo = low_sum;
    z->hi = high_sum;
  }


  /*************************************************************************/
  /*                                                                       */
  /* <Function>                                                            */
  /*    FT_MulTo64                                                         */
  /*                                                                       */
  /* <Description>                                                         */
  /*    Multiplies two Int32 integers.  Returns an Int64 integer.          */
  /*                                                                       */
  /* <Input>                                                               */
  /*    x :: The first multiplier.                                         */
  /*    y :: The second multiplier.                                        */
  /*                                                                       */
  /* <Output>                                                              */
  /*    z :: A pointer to the result of `x * y'.                           */
  /*                                                                       */
  /* <Note>                                                                */
  /*    Will be wrapped by the MUL_64() macro.                             */
  /*                                                                       */
  FT_EXPORT_FUNC( void )  FT_MulTo64( FT_Int32   x,
                                      FT_Int32   y,
                                      FT_Int64*  z )
  {
    FT_Int32   s;
    FT_UInt32  lo1, hi1, lo2, hi2, lo, hi, i1, i2;


    /* `s' is negative when the operands have different signs; the */
    /* multiplication itself is done on the magnitudes             */
    s  = x; x = ABS( x );
    s ^= y; y = ABS( y );

    /* split both magnitudes into 16-bit halves */
    lo1 = x & 0x0000FFFF;  hi1 = x >> 16;
    lo2 = y & 0x0000FFFF;  hi2 = y >> 16;

    /* the four 16x16 partial products */
    lo = lo1 * lo2;
    i1 = lo1 * hi2;
    i2 = lo2 * hi1;
    hi = hi1 * hi2;

    /* Check carry overflow of i1 + i2 */
    i1 += i2;
    if ( i1 < i2 )
      hi += 1L << 16;

    /* the middle sum straddles both words: its upper half goes to */
    /* `hi', its lower half is added to `lo'                       */
    hi += i1 >> 16;
    i1  = i1 << 16;

    /* Check carry overflow of i1 + lo */
    lo += i1;
    hi += ( lo < i1 );

    if ( s < 0 )
    {
      /* Negate the 64-bit magnitude.  This is done in unsigned     */
      /* arithmetic: negating the low word as a signed value would  */
      /* overflow when it equals 0x80000000.                        */
      lo = (FT_UInt32)( 0 - lo );
      hi = ~hi + !lo;
    }

    z->lo = lo;
    z->hi = hi;
  }


  /*************************************************************************/
  /*                                                                       */
  /* <Function>                                                            */
  /*    FT_Div64by32                                                       */
  /*                                                                       */
  /* <Description>                                                         */
  /*    Divides an Int64 value by an Int32 value.  Returns an Int32        */
  /*    integer.                                                           */
  /*                                                                       */
  /* <Input>                                                               */
  /*    x :: A pointer to the dividend.                                    */
  /*    y :: The divisor.                                                  */
  /*                                                                       */
  /* <Return>                                                              */
  /*    The result of `x / y'.                                             */
  /*                                                                       */
  /* <Note>                                                                */
  /*    Will be wrapped by the DIV_64() macro.                             */
  /*                                                                       */
  FT_EXPORT_FUNC( FT_Int32 )  FT_Div64by32( FT_Int64*  x,
                                            FT_Int32   y )
  {
    FT_Int32   s;
    FT_UInt32  q, r, i, lo;


    /* Work on local copies of the dividend: `x' is an input and */
    /* must not be modified on behalf of the caller.             */
    r  = x->hi;
    lo = x->lo;

    s  = x->hi;
    if ( s < 0 )
    {
      /* Take the magnitude of a negative dividend.  The negation is */
      /* done in unsigned arithmetic so that a low word of           */
      /* 0x80000000 cannot cause a signed overflow.                  */
      lo = (FT_UInt32)( 0 - lo );
      r  = ~r + !lo;
    }

    /* `s' is now negative when dividend and divisor differ in sign */
    s ^= y;  y = ABS( y );

    /* Shortcut: the dividend fits in 32 bits */
    if ( r == 0 )
    {
      if ( y > 0 )
        q = lo / y;
      else
        q = 0x7FFFFFFFL;

      return ( s < 0 ? -(FT_Int32)q : (FT_Int32)q );
    }

    if ( r >= (FT_UInt32)y ) /* we know y is to be treated as unsigned here */
      return ( s < 0 ? 0x80000001UL : 0x7FFFFFFFUL );
                             /* Return Max/Min Int32 if division overflow.  */
                             /* This includes division by zero!             */

    /* Bit-by-bit long division: shift the next dividend bit into */
    /* the running remainder `r' and subtract the divisor         */
    /* whenever it fits, producing one quotient bit per step.     */
    q = 0;
    for ( i = 0; i < 32; i++ )
    {
      r <<= 1;
      q <<= 1;
      r  |= lo >> 31;

      if ( r >= (FT_UInt32)y )
      {
        r -= y;
        q |= 1;
      }
      lo <<= 1;
    }

    return ( s < 0 ? -(FT_Int32)q : (FT_Int32)q );
  }


#ifdef FT_CONFIG_OPTION_OLD_CALCS


  /* two helper functions for FT_Sqrt64() */

  static
  void  FT_Sub64( FT_Int64*  x,
                  FT_Int64*  y,
                  FT_Int64*  z )
  {
    register FT_UInt32  lo, hi;


    /* Compute `z = x - y'.  A borrow out of the low word happens */
    /* exactly when the low word of `x' is smaller than that of   */
    /* `y'.  Both words are computed before `z' is written, so    */
    /* `z' may be the same object as `x' or `y'.                  */
    lo = x->lo - y->lo;
    hi = x->hi - y->hi - ( x->lo < y->lo );

    z->lo = lo;
    z->hi = hi;
  }


  static
  int  ft_order64( FT_Int64*  z )
  {
    FT_UInt32  word;
    int        order;


    /* pick the most significant non-zero word and the bit index */
    /* just below its lowest bit                                 */
    if ( z->hi )
    {
      word  = z->hi;
      order = 31;
    }
    else
    {
      word  = z->lo;
      order = -1;
    }

    /* one step per bit up to the highest set one; a zero value */
    /* therefore yields -1                                      */
    for ( ; word > 0; word >>= 1 )
      order++;

    return order;
  }


  /*************************************************************************/
  /*                                                                       */
  /* <Function>                                                            */
  /*    FT_Sqrt64                                                          */
  /*                                                                       */
  /* <Description>                                                         */
  /*    Computes the square root of a 64-bit value.  That sounds stupid,   */
  /*    but it is needed to obtain maximal accuracy in the TrueType        */
  /*    bytecode interpreter.                                              */
  /*                                                                       */
  /* <Input>                                                               */
  /*    l :: A pointer to a 64-bit integer.                                */
  /*                                                                       */
  /* <Return>                                                              */
  /*    The 32-bit square-root.                                            */
  /*                                                                       */
  FT_EXPORT_FUNC( FT_Int32 )  FT_Sqrt64( FT_Int64*  l )
  {
    FT_Int64  diff;
    FT_Int32  root, prev;
    int       order;


    /* negative values and zero both yield zero */
    if ( (FT_Int32)l->hi < 0 )
      return 0;

    if ( l->hi == 0 && l->lo == 0 )
      return 0;

    /* order 0 means the value is exactly 1 */
    order = ft_order64( l );
    if ( order == 0 )
      return 1;

    /* seed the iteration from the table, indexed by the top set bit */
    root = ft_square_roots[order];

    for (;;)
    {
      prev = root;
      root = ( root + FT_Div64by32( l, root ) ) >> 1;

      /* diff = l - root * root */
      FT_MulTo64( root, root, &diff );
      FT_Sub64  ( l, &diff, &diff );

      /* stop once the estimate no longer grows and its square fits */
      if ( root <= prev && (FT_Int32)diff.hi >= 0 )
        break;
    }

    return root;
  }

#endif /* FT_CONFIG_OPTION_OLD_CALCS */

#endif /* FT_LONG64 */


/* END */
Commit	Line	Data
cabec872 RR	1	/***************************************************************************/
	2	/* */
	3	/* ftcalc.c */
	4	/* */
	5	/* Arithmetic computations (body). */
	6	/* */
	7	/* Copyright 1996-2000 by */
	8	/* David Turner, Robert Wilhelm, and Werner Lemberg. */
	9	/* */
	10	/* This file is part of the FreeType project, and may only be used, */
	11	/* modified, and distributed under the terms of the FreeType project */
	12	/* license, LICENSE.TXT. By continuing to use, modify, or distribute */
	13	/* this file you indicate that you have read the license and */
	14	/* understand and accept it fully. */
	15	/* */
	16	/***************************************************************************/
	17
	18	/*************************************************************************/
	19	/* */
	20	/* Support for 1-complement arithmetic has been totally dropped in this */
	21	/* release. You can still write your own code if you need it. */
	22	/* */
	23	/*************************************************************************/
	24
	25	/*************************************************************************/
	26	/* */
	27	/* Implementing basic computation routines. */
	28	/* */
	29	/* FT_MulDiv(), FT_MulFix(), and FT_DivFix() are declared in freetype.h. */
	30	/* */
	31	/*************************************************************************/
	32
	33
	34	#include <freetype/internal/ftcalc.h>
	35	#include <freetype/internal/ftdebug.h>
	36	#include <freetype/internal/ftobjs.h> /* for ABS() */
	37
	38
	39	/*************************************************************************/
	40	/* */
	41	/* The macro FT_COMPONENT is used in trace mode. It is an implicit */
	42	/* parameter of the FT_TRACE() and FT_ERROR() macros, used to print/log */
	43	/* messages during execution. */
	44	/* */
	45	#undef FT_COMPONENT
	46	#define FT_COMPONENT trace_calc
	47
	48
	49	#ifdef FT_CONFIG_OPTION_OLD_CALCS
	50
	51	static const FT_Long ft_square_roots[63] =
	52	{
	53	1L, 1L, 2L, 3L, 4L, 5L, 8L, 11L,
	54	16L, 22L, 32L, 45L, 64L, 90L, 128L, 181L,
	55	256L, 362L, 512L, 724L, 1024L, 1448L, 2048L, 2896L,
	56	4096L, 5892L, 8192L, 11585L, 16384L, 23170L, 32768L, 46340L,
	57
	58	65536L, 92681L, 131072L, 185363L, 262144L, 370727L,
	59	524288L, 741455L, 1048576L, 1482910L, 2097152L, 2965820L,
	60	4194304L, 5931641L, 8388608L, 11863283L, 16777216L, 23726566L,
	61
	62	33554432L, 47453132L, 67108864L, 94906265L,
	63	134217728L, 189812531L, 268435456L, 379625062L,
	64	536870912L, 759250125L, 1073741824L, 1518500250L,
65	2147483647L
66	};
67
68	#else
69
70	/*************************************************************************/
71	/* */
72	/* <Function> */
73	/* FT_Sqrt32 */
74	/* */
75	/* <Description> */
76	/* Computes the square root of an Int32 integer (which will be */
77	/* handled as an unsigned long value). */
78	/* */
79	/* <Input> */
80	/* x :: The value to compute the root for. */
81	/* */
82	/* <Return> */
83	/* The result of `sqrt(x)'. */
84	/* */
85	FT_EXPORT_FUNC( FT_Int32 ) FT_Sqrt32( FT_Int32 x )
86	{
87	FT_ULong val, root, newroot, mask;
88
89
90	root = 0;
91	mask = 0x40000000L;
92	val = (FT_ULong)x;
93
94	do
95	{
96	newroot = root + mask;
97	if ( newroot <= val )
98	{
99	val -= newroot;
100	root = newroot + mask;
101	}
102
103	root >>= 1;
104	mask >>= 2;
105
106	} while ( mask != 0 );
107
108	return root;
109	}
110
111	#endif /* FT_CONFIG_OPTION_OLD_CALCS */
112
113
114	#ifdef FT_LONG64
115
116	/*************************************************************************/
117	/* */
118	/* <Function> */
119	/* FT_MulDiv */
120	/* */
121	/* <Description> */
	122	/* A very simple function used to perform the computation `(a*b)/c' */
123	/* with maximal accuracy (it uses a 64-bit intermediate integer */
124	/* whenever necessary). */
125	/* */
126	/* This function isn't necessarily as fast as some processor specific */
127	/* operations, but is at least completely portable. */
128	/* */
129	/* <Input> */
130	/* a :: The first multiplier. */
131	/* b :: The second multiplier. */
132	/* c :: The divisor. */
133	/* */
134	/* <Return> */
	135	/* The result of `(a*b)/c'. This function never traps when trying to */
136	/* divide by zero; it simply returns `MaxInt' or `MinInt' depending */
137	/* on the signs of `a' and `b'. */
138	/* */
139	FT_EXPORT_FUNC( FT_Long ) FT_MulDiv( FT_Long a,
140	FT_Long b,
141	FT_Long c )
142	{
143	FT_Int s;
144
145
146	s = 1;
147	if ( a < 0 ) { a = -a; s = -s; }
148	if ( b < 0 ) { b = -b; s = -s; }
149	if ( c < 0 ) { c = -c; s = -s; }
150
151	return s * ( c > 0 ? ( (FT_Int64)a * b + ( c >> 1 ) ) / c
152	: 0x7FFFFFFFL );
153	}
154
155
156	/*************************************************************************/
157	/* */
158	/* <Function> */
159	/* FT_MulFix */
160	/* */
161	/* <Description> */
162	/* A very simple function used to perform the computation */
	163	/* `(a*b)/0x10000' with maximal accuracy. Most of the time this is */
164	/* used to multiply a given value by a 16.16 fixed float factor. */
165	/* */
166	/* <Input> */
167	/* a :: The first multiplier. */
168	/* b :: The second multiplier. Use a 16.16 factor here whenever */
169	/* possible (see note below). */
170	/* */
171	/* <Return> */
	172	/* The result of `(a*b)/0x10000'. */
173	/* */
174	/* <Note> */
175	/* This function has been optimized for the case where the absolute */
176	/* value of `a' is less than 2048, and `b' is a 16.16 scaling factor. */
177	/* As this happens mainly when scaling from notional units to */
178	/* fractional pixels in FreeType, it resulted in noticeable speed */
179	/* improvements between versions 2.x and 1.x. */
180	/* */
181	/* As a conclusion, always try to place a 16.16 factor as the */
182	/* _second_ argument of this function; this can make a great */
183	/* difference. */
184	/* */
185	FT_EXPORT_FUNC( FT_Long ) FT_MulFix( FT_Long a,
186	FT_Long b )
187	{
188	FT_Int s;
189
190
191	s = 1;
192	if ( a < 0 ) { a = -a; s = -s; }
193	if ( b < 0 ) { b = -b; s = -s; }
194
195	return s * (FT_Long)( ( (FT_Int64)a * b + 0x8000 ) >> 16 );
196	}
197
198
199	/*************************************************************************/
200	/* */
201	/* <Function> */
202	/* FT_DivFix */
203	/* */
204	/* <Description> */
205	/* A very simple function used to perform the computation */
	206	/* `(a*0x10000)/b' with maximal accuracy. Most of the time, this is */
207	/* used to divide a given value by a 16.16 fixed float factor. */
208	/* */
209	/* <Input> */
210	/* a :: The first multiplier. */
211	/* b :: The second multiplier. Use a 16.16 factor here whenever */
212	/* possible (see note below). */
213	/* */
214	/* <Return> */
	215	/* The result of `(a*0x10000)/b'. */
216	/* */
217	/* <Note> */
218	/* The optimization for FT_DivFix() is simple: If (a << 16) fits in */
219	/* 32 bits, then the division is computed directly. Otherwise, we */
220	/* use a specialized version of the old FT_MulDiv64(). */
221	/* */
222	FT_EXPORT_FUNC( FT_Long ) FT_DivFix( FT_Long a,
223	FT_Long b )
224	{
225	FT_Int32 s;
226	FT_UInt32 q;
227
228
229	s = a; a = ABS(a);
230	s ^= b; b = ABS(b);
231
232	if ( b == 0 )
233	/* check for division by 0 */
234	q = 0x7FFFFFFFL;
235	else
236	/* compute result directly */
237	q = ( (FT_Int64)a << 16 ) / b;
238
239	return (FT_Int32)( s < 0 ? -q : q );
240	}
241
242
243	#ifdef FT_CONFIG_OPTION_OLD_CALCS
244
245	/* a helper function for FT_Sqrt64() */
246
247	static
248	int ft_order64( FT_Int64 z )
249	{
250	int j = 0;
251
252
253	while ( z )
254	{
255	z = (unsigned FT_INT64)z >> 1;
256	j++;
257	}
258	return j - 1;
259	}
260
261
262	/*************************************************************************/
263	/* */
264	/* <Function> */
265	/* FT_Sqrt64 */
266	/* */
267	/* <Description> */
268	/* Computes the square root of a 64-bit value. That sounds stupid, */
269	/* but it is needed to obtain maximal accuracy in the TrueType */
270	/* bytecode interpreter. */
271	/* */
272	/* <Input> */
273	/* l :: A 64-bit integer. */
274	/* */
275	/* <Return> */
276	/* The 32-bit square-root. */
277	/* */
278	FT_EXPORT_FUNC( FT_Int32 ) FT_Sqrt64( FT_Int64 l )
279	{
280	FT_Int64 r, s;
281
282
283	if ( l <= 0 ) return 0;
284	if ( l == 1 ) return 1;
285
286	r = ft_square_roots[ft_order64( l )];
287
288	do
289	{
290	s = r;
291	r = ( r + l / r ) >> 1;
292
293	} while ( r > s \|\| r * r > l );
294
295	return r;
296	}
297
298	#endif /* FT_CONFIG_OPTION_OLD_CALCS */
299
300
301	#else /* FT_LONG64 */
302
303
304	/*************************************************************************/
305	/* */
306	/* <Function> */
307	/* FT_MulDiv */
308	/* */
309	/* <Description> */
	310	/* A very simple function used to perform the computation `(a*b)/c' */
311	/* with maximal accuracy (it uses a 64-bit intermediate integer */
312	/* whenever necessary). */
313	/* */
314	/* This function isn't necessarily as fast as some processor specific */
315	/* operations, but is at least completely portable. */
316	/* */
317	/* <Input> */
318	/* a :: The first multiplier. */
319	/* b :: The second multiplier. */
320	/* c :: The divisor. */
321	/* */
322	/* <Return> */
	323	/* The result of `(a*b)/c'. This function never traps when trying to */
324	/* divide by zero; it simply returns `MaxInt' or `MinInt' depending */
325	/* on the signs of `a' and `b'. */
326	/* */
327	/* <Note> */
328	/* The FT_MulDiv() function has been optimized thanks to ideas from */
329	/* Graham Asher. The trick is to optimize computation if everything */
330	/* fits within 32 bits (a rather common case). */
331	/* */
	332	/* We compute `a*b+c/2', then divide it by `c' (positive values). */
	333	/* */
	334	/* 46340 is FLOOR(SQRT(2^31-1)). */
	335	/* */
	336	/* if ( a <= 46340 && b <= 46340 ) then ( a*b <= 0x7FFEA810 ) */
	337	/* */
	338	/* 0x7FFFFFFF - 0x7FFEA810 = 0x157F0 */
	339	/* */
	340	/* if ( c < 0x157F0*2 ) then ( a*b+c/2 <= 0x7FFFFFFF ) */
	341	/* */
	342	/* and 2*0x157F0 = 176096. */
343	/* */
344	FT_EXPORT_FUNC( FT_Long ) FT_MulDiv( FT_Long a,
345	FT_Long b,
346	FT_Long c )
347	{
348	long s;
349
350
351	if ( a == 0 \|\| b == c )
352	return a;
353
354	s = a; a = ABS( a );
355	s ^= b; b = ABS( b );
356	s ^= c; c = ABS( c );
357
358	if ( a <= 46340 && b <= 46340 && c <= 176095L && c > 0 )
359	{
360	a = ( a * b + ( c >> 1 ) ) / c;
361	}
362	else if ( c > 0 )
363	{
364	FT_Int64 temp, temp2;
365
366
367	FT_MulTo64( a, b, &temp );
368	temp2.hi = (FT_Int32)( c >> 31 );
369	temp2.lo = (FT_UInt32)( c / 2 );
370	FT_Add64( &temp, &temp2, &temp );
371	a = FT_Div64by32( &temp, c );
372	}
373	else
374	a = 0x7FFFFFFFL;
375
376	return ( s < 0 ? -a : a );
377	}
378
379
380	/*************************************************************************/
381	/* */
382	/* <Function> */
383	/* FT_MulFix */
384	/* */
385	/* <Description> */
386	/* A very simple function used to perform the computation */
	387	/* `(a*b)/0x10000' with maximal accuracy. Most of the time, this is */
388	/* used to multiply a given value by a 16.16 fixed float factor. */
389	/* */
390	/* <Input> */
391	/* a :: The first multiplier. */
392	/* b :: The second multiplier. Use a 16.16 factor here whenever */
393	/* possible (see note below). */
394	/* */
395	/* <Return> */
	396	/* The result of `(a*b)/0x10000'. */
397	/* */
398	/* <Note> */
399	/* The optimization for FT_MulFix() is different. We could simply be */
400	/* happy by applying the same principles as with FT_MulDiv(), because */
401	/* */
402	/* c = 0x10000 < 176096 */
403	/* */
404	/* However, in most cases, we have a `b' with a value around 0x10000 */
405	/* which is greater than 46340. */
406	/* */
407	/* According to some testing, most cases have `a' < 2048, so a good */
408	/* idea is to use bounds like 2048 and 1048576 (=floor((2^31-1)/2048) */
409	/* for `a' and `b', respectively. */
410	/* */
411	FT_EXPORT_FUNC( FT_Long ) FT_MulFix( FT_Long a,
412	FT_Long b )
413	{
414	FT_Long s;
415	FT_ULong ua, ub;
416
417
418	if ( a == 0 \|\| b == 0x10000L )
419	return a;
420
421	s = a; a = ABS(a);
422	s ^= b; b = ABS(b);
423
424	ua = (FT_ULong)a;
425	ub = (FT_ULong)b;
426
427	if ( ua <= 2048 && ub <= 1048576L )
428	{
429	ua = ( ua * ub + 0x8000 ) >> 16;
430	}
431	else
432	{
433	FT_ULong al = ua & 0xFFFF;
434
435
436	ua = ( ua >> 16 ) * ub +
437	al * ( ub >> 16 ) +
438	( al * ( ub & 0xFFFF ) >> 16 );
439	}
440
441	return ( s < 0 ? -(FT_Long)ua : ua );
442	}
443
444
445	/*************************************************************************/
446	/* */
447	/* <Function> */
448	/* FT_DivFix */
449	/* */
450	/* <Description> */
451	/* A very simple function used to perform the computation */
	452	/* `(a*0x10000)/b' with maximal accuracy. Most of the time, this is */
453	/* used to divide a given value by a 16.16 fixed float factor. */
454	/* */
455	/* <Input> */
456	/* a :: The first multiplier. */
457	/* b :: The second multiplier. Use a 16.16 factor here whenever */
458	/* possible (see note below). */
459	/* */
460	/* <Return> */
	461	/* The result of `(a*0x10000)/b'. */
462	/* */
463	/* <Note> */
464	/* The optimization for FT_DivFix() is simple: If (a << 16) fits into */
465	/* 32 bits, then the division is computed directly. Otherwise, we */
466	/* use a specialized version of the old FT_MulDiv64(). */
467	/* */
468	FT_EXPORT_FUNC( FT_Long ) FT_DivFix( FT_Long a,
469	FT_Long b )
470	{
471	FT_Int32 s;
472	FT_UInt32 q;
473
474
475	s = a; a = ABS(a);
476	s ^= b; b = ABS(b);
477
478	if ( b == 0 )
479	{
480	/* check for division by 0 */
481	q = 0x7FFFFFFFL;
482	}
483	else if ( ( a >> 16 ) == 0 )
484	{
485	/* compute result directly */
486	q = (FT_UInt32)( a << 16 ) / (FT_UInt32)b;
487	}
488	else
489	{
490	/* we need more bits; we have to do it by hand */
491	FT_UInt32 c;
492
493
494	q = ( a / b ) << 16;
495	c = a % b;
496
	497	/* we must compute C*0x10000/B: we simply shift C and B so */
498	/* C becomes smaller than 16 bits */
499	while ( c >> 16 )
500	{
501	c >>= 1;
502	b <<= 1;
503	}
504
505	q += ( c << 16 ) / b;
506	}
507
508	return ( s < 0 ? -(FT_Int32)q : (FT_Int32)q );
509	}
510
511
512	/*************************************************************************/
513	/* */
514	/* <Function> */
515	/* FT_Add64 */
516	/* */
517	/* <Description> */
518	/* Add two Int64 values. */
519	/* */
520	/* <Input> */
521	/* x :: A pointer to the first value to be added. */
522	/* y :: A pointer to the second value to be added. */
523	/* */
524	/* <Output> */
525	/* z :: A pointer to the result of `x + y'. */
526	/* */
527	/* <Note> */
528	/* Will be wrapped by the ADD_64() macro. */
529	/* */
530	FT_EXPORT_FUNC( void ) FT_Add64( FT_Int64* x,
531	FT_Int64* y,
532	FT_Int64* z )
533	{
534	register FT_UInt32 lo, hi;
535
536
537	lo = x->lo + y->lo;
538	hi = x->hi + y->hi + ( lo < x->lo );
539
540	z->lo = lo;
541	z->hi = hi;
542	}
543
544
545	/*************************************************************************/
546	/* */
547	/* <Function> */
548	/* FT_MulTo64 */
549	/* */
550	/* <Description> */
551	/* Multiplies two Int32 integers. Returns an Int64 integer. */
552	/* */
553	/* <Input> */
554	/* x :: The first multiplier. */
555	/* y :: The second multiplier. */
556	/* */
557	/* <Output> */
558	/* z :: A pointer to the result of `x * y'. */
559	/* */
560	/* <Note> */
561	/* Will be wrapped by the MUL_64() macro. */
562	/* */
563	FT_EXPORT_FUNC( void ) FT_MulTo64( FT_Int32 x,
564	FT_Int32 y,
565	FT_Int64* z )
566	{
567	FT_Int32 s;
568
569
570	s = x; x = ABS( x );
571	s ^= y; y = ABS( y );
572
573	{
574	FT_UInt32 lo1, hi1, lo2, hi2, lo, hi, i1, i2;
575
576
577	lo1 = x & 0x0000FFFF; hi1 = x >> 16;
578	lo2 = y & 0x0000FFFF; hi2 = y >> 16;
579
580	lo = lo1 * lo2;
581	i1 = lo1 * hi2;
582	i2 = lo2 * hi1;
583	hi = hi1 * hi2;
584
585	/* Check carry overflow of i1 + i2 */
586	i1 += i2;
587	if ( i1 < i2 )
588	hi += 1L << 16;
589
590	hi += i1 >> 16;
591	i1 = i1 << 16;
592
593	/* Check carry overflow of i1 + lo */
594	lo += i1;
595	hi += ( lo < i1 );
596
597	z->lo = lo;
598	z->hi = hi;
599	}
600
601	if ( s < 0 )
602	{
603	z->lo = (FT_UInt32)-(FT_Int32)z->lo;
604	z->hi = ~z->hi + !( z->lo );
605	}
606	}
607
608
609	/*************************************************************************/
610	/* */
611	/* <Function> */
612	/* FT_Div64by32 */
613	/* */
614	/* <Description> */
615	/* Divides an Int64 value by an Int32 value. Returns an Int32 */
616	/* integer. */
617	/* */
618	/* <Input> */
619	/* x :: A pointer to the dividend. */
620	/* y :: The divisor. */
621	/* */
622	/* <Return> */
623	/* The result of `x / y'. */
624	/* */
625	/* <Note> */
626	/* Will be wrapped by the DIV_64() macro. */
627	/* */
628	FT_EXPORT_FUNC( FT_Int32 ) FT_Div64by32( FT_Int64* x,
629	FT_Int32 y )
630	{
631	FT_Int32 s;
632	FT_UInt32 q, r, i, lo;
633
634
635	s = x->hi;
636	if ( s < 0 )
637	{
638	x->lo = (FT_UInt32)-(FT_Int32)x->lo;
639	x->hi = ~x->hi + !( x->lo );
640	}
641	s ^= y; y = ABS( y );
642
643	/* Shortcut */
644	if ( x->hi == 0 )
645	{
646	if ( y > 0 )
647	q = x->lo / y;
648	else
649	q = 0x7FFFFFFFL;
650
651	return ( s < 0 ? -(FT_Int32)q : (FT_Int32)q );
652	}
653
654	r = x->hi;
655	lo = x->lo;
656
657	if ( r >= (FT_UInt32)y ) /* we know y is to be treated as unsigned here */
658	return ( s < 0 ? 0x80000001UL : 0x7FFFFFFFUL );
659	/* Return Max/Min Int32 if division overflow. */
660	/* This includes division by zero! */
661	q = 0;
662	for ( i = 0; i < 32; i++ )
663	{
664	r <<= 1;
665	q <<= 1;
666	r \|= lo >> 31;
667
668	if ( r >= (FT_UInt32)y )
669	{
670	r -= y;
671	q \|= 1;
672	}
673	lo <<= 1;
674	}
675
676	return ( s < 0 ? -(FT_Int32)q : (FT_Int32)q );
677	}
678
679
680	#ifdef FT_CONFIG_OPTION_OLD_CALCS
681
682
683	/* two helper functions for FT_Sqrt64() */
684
685	static
686	void FT_Sub64( FT_Int64* x,
687	FT_Int64* y,
688	FT_Int64* z )
689	{
690	register FT_UInt32 lo, hi;
691
692
693	lo = x->lo - y->lo;
694	hi = x->hi - y->hi - ( (FT_Int32)lo < 0 );
695
696	z->lo = lo;
697	z->hi = hi;
698	}
699
700
701	static
702	int ft_order64( FT_Int64* z )
703	{
704	FT_UInt32 i;
705	int j;
706
707
708	i = z->lo;
709	j = 0;
710	if ( z->hi )
711	{
712	i = z->hi;
713	j = 32;
714	}
715
716	while ( i > 0 )
717	{
718	i >>= 1;
719	j++;
720	}
721	return j - 1;
722	}
723
724
725	/*************************************************************************/
726	/* */
727	/* <Function> */
728	/* FT_Sqrt64 */
729	/* */
730	/* <Description> */
731	/* Computes the square root of a 64-bits value. That sounds stupid, */
732	/* but it is needed to obtain maximal accuracy in the TrueType */
733	/* bytecode interpreter. */
734	/* */
735	/* <Input> */
736	/* z :: A pointer to a 64-bit integer. */
737	/* */
738	/* <Return> */
739	/* The 32-bit square-root. */
740	/* */
741	FT_EXPORT_FUNC( FT_Int32 ) FT_Sqrt64( FT_Int64* l )
742	{
743	FT_Int64 l2;
744	FT_Int32 r, s;
745
746
747	if ( (FT_Int32)l->hi < 0 \|\|
748	( l->hi == 0 && l->lo == 0 ) )
749	return 0;
750
751	s = ft_order64( l );
752	if ( s == 0 )
753	return 1;
754
755	r = ft_square_roots[s];
756	do
757	{
758	s = r;
759	r = ( r + FT_Div64by32( l, r ) ) >> 1;
760	FT_MulTo64( r, r, &l2 );
761	FT_Sub64 ( l, &l2, &l2 );
762
763	} while ( r > s \|\| (FT_Int32)l2.hi < 0 );
764
765	return r;
766	}
767
768	#endif /* FT_CONFIG_OPTION_OLD_CALCS */
769
770	#endif /* FT_LONG64 */
771
772
773	/* END */