cscg22-gearboy

CSCG 2022 Challenge 'Gearboy'
git clone https://git.sinitax.com/sinitax/cscg22-gearboy
Log | Files | Refs | sfeed.txt

_mullong.c (3174B)


      1/*-------------------------------------------------------------------------
      2   _mullong.c - routine for multiplication of 32 bit (unsigned) long
      3
      4   Copyright (C) 1999, Sandeep Dutta . sandeep.dutta@usa.net
      5   Copyright (C) 1999, Jean Louis VERN jlvern@writeme.com
      6
      7   This library is free software; you can redistribute it and/or modify it
      8   under the terms of the GNU General Public License as published by the
      9   Free Software Foundation; either version 2, or (at your option) any
     10   later version.
     11
     12   This library is distributed in the hope that it will be useful,
     13   but WITHOUT ANY WARRANTY; without even the implied warranty of
     14   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
     15   GNU General Public License for more details.
     16
     17   You should have received a copy of the GNU General Public License
     18   along with this library; see the file COPYING. If not, write to the
     19   Free Software Foundation, 51 Franklin Street, Fifth Floor, Boston,
     20   MA 02110-1301, USA.
     21
     22   As a special exception, if you link this library with other files,
     23   some of which are compiled with SDCC, to produce an executable,
     24   this library does not by itself cause the resulting executable to
     25   be covered by the GNU General Public License. This exception does
     26   not however invalidate any other reasons why the executable file
     27   might be covered by the GNU General Public License.
     28-------------------------------------------------------------------------*/
     29
     30
     /* Plain aggregate of a short, a char and a long.
        Nothing in the visible part of this file refers to it.  */
     struct some_struct
     {
       short a;
       char b;
       long c;
     };
     /* Overlapping views of one unsigned long:
          b  - four separate bytes b0..b3
          i  - two unsigned short halves, lo and hi
          l  - the whole value
          bi - byte b0, an unsigned short i12, byte b3

        NOTE(review): the views only line up as the names suggest when the
        target stores the least significant byte first, long is 4 bytes,
        short is 2 bytes and no padding is inserted before bi.i12 --
        confirm for each target this file is built for.  */
     union bil
     {
       struct
       {
         unsigned char b0;
         unsigned char b1;
         unsigned char b2;
         unsigned char b3;
       } b;

       struct
       {
         unsigned short lo;
         unsigned short hi;
       } i;

       unsigned long l;

       struct
       {
         unsigned char b0;
         unsigned short i12;
         unsigned char b3;
       } bi;
     };

     /* Reinterpret the storage of lvalue x as a union bil and yield a
        pointer to it.  */
     #define bcast(x) ((union bil *)&(x))
     43
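     /*
        Schoolbook product of two 4-byte operands.  The two header rows number
        the bytes of each operand (3 = most significant).  An entry i.j stands
        for the 8x8->16 product of byte i of one operand and byte j of the
        other.  Rows A-G show the same products as 16-bit cells placed at their
        byte offset (one byte is two characters wide there); only the cells to
        the right of the marker contribute to the low 32 bits of the result.

                          3   2   1   0
            X             3   2   1   0
            ----------------------------
                        0.3 0.2 0.1 0.0
                    1.3 1.2 1.1 1.0
                2.3 2.2 2.1 2.0
            3.3 3.2 3.1 3.0
            ----------------------------
                       |3.3|1.3|0.2|0.0|   A
                         |2.3|0.3|0.1|     B
                         |3.2|1.2|1.0|     C
                           |2.2|1.1|       D
                           |3.1|2.0|       E
                             |2.1|         F
                             |3.0|         G
                               |-------> only this side 32 x 32 -> 32
     */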
     62
     /* 32x32->32 multiplication to be used
        if 16x16->16 is faster than three 8x8->16.
        2009, by M.Bodrato ( http://bodrato.it/ )

        z80 and sm83 don't have any hardware multiplication.
        r2k and r3k have 16x16 hardware multiplication.
      */
     70long _mullong (long a, long b)
     71{
     72  unsigned short i12;
     73
     74  bcast(a)->i.hi *= bcast(b)->i.lo;
     75  bcast(a)->i.hi += bcast(b)->i.hi * bcast(a)->i.lo;
     76
     77  /* only (a->i.lo * b->i.lo) 16x16->32 to do. asm? */
     78  bcast(a)->i.hi += bcast(a)->b.b1 * bcast(b)->b.b1;
     79
     80  i12 = bcast(b)->b.b0 * bcast(a)->b.b1;
     81  bcast(b)->bi.i12 = bcast(a)->b.b0 * bcast(b)->b.b1;
     82
     83  /* add up the two partial result, store carry in b3 */
     84  bcast(b)->b.b3 = ((bcast(b)->bi.i12 += i12) < i12);
     85
     86  bcast(a)->i.lo  = bcast(a)->b.b0 * bcast(b)->b.b0;
     87
     88  bcast(b)->bi.b0 = 0;
     89
     90  return a + b;
     91}