1 files changed, 231 insertions, 0 deletions
diff --git a/benchmarks/CHStone/jpeg/chenidct.c b/benchmarks/CHStone/jpeg/chenidct.c
new file mode 100755
index 0000000..1e0278e
--- /dev/null
+++ b/benchmarks/CHStone/jpeg/chenidct.c
@@ -0,0 +1,231 @@
+/*
++--------------------------------------------------------------------------+
+| CHStone : A suite of Benchmark Programs for C-based High-Level Synthesis |
+| ======================================================================== |
+|                                                                          |
+| * Collected and Modified : Y. Hara, H. Tomiyama, S. Honda,               |
+|                            H. Takada and K. Ishii                        |
+|                            Nagoya University, Japan                      |
+|                                                                          |
+| * Remarks :                                                              |
+|    1. This source code is reformatted to follow CHStone's style.         |
+|    2. Test vectors are added for CHStone.                                |
+|    3. If "main_result" is 0 at the end of the program, the program is    |
+|       successfully executed.                                             |
+|    4. Follow the copyright of each benchmark program.                    |
++--------------------------------------------------------------------------+
+*/
+/*
+ *  IDCT transformation of Chen algorithm
+ *
+ *  @(#) $Id: chenidct.c,v 1.2 2003/07/18 10:19:21 honda Exp $
+ */
+/*************************************************************
+Copyright (C) 1990, 1991, 1993 Andy C. Hung, all rights reserved.
+PUBLIC DOMAIN LICENSE: Stanford University Portable Video Research
+Group. If you use this software, you agree to the following: This
+program package is purely experimental, and is licensed "as is".
+Permission is granted to use, modify, and distribute this program
+without charge for any purpose, provided this license/ disclaimer
+notice appears in the copies.  No warranty or maintenance is given,
+either expressed or implied.  In no event shall the author(s) be
+liable to you or a third party for any special, incidental,
+consequential, or other damages, arising out of the use or inability
+to use the program for any purpose (or the loss of data), even if we
+have been advised of such possibilities.  Any public reference or
+advertisement of this source code should refer to it as the Portable
+Video Research Group (PVRG) code, and not by any author(s) (or
+Stanford University) name.
+*************************************************************/
+/*
+************************************************************
+chendct.c
+
+A simple DCT algorithm that seems to have fairly nice arithmetic
+properties.
+
+W. H. Chen, C. H. Smith and S. C. Fralick "A fast computational
+algorithm for the discrete cosine transform," IEEE Trans. Commun.,
+vol. COM-25, pp. 1004-1009, Sept 1977.
+
+************************************************************
+*/
+
+#define LS(r,s) ((r) << (s))
+#define RS(r,s) ((r) >> (s))	/* Caution with rounding... */
+
+#define MSCALE(expr)  RS((expr),9)
+
+/* Cos constants */
+
+#define c1d4 362L
+
+#define c1d8 473L
+#define c3d8 196L
+
+#define c1d16 502L
+#define c3d16 426L
+#define c5d16 284L
+#define c7d16 100L
+
+
+/*
+ *
+ * ChenIDCT() implements the Chen inverse dct. Note that there are two
+ * input vectors that represent x=input, and y=output, and must be
+ * defined (and storage allocated) before this routine is called.
+ */
+void
+ChenIDct (int *x, int *y)
+{
+  register int i;
+  register int *aptr;
+  register int a0, a1, a2, a3;
+  register int b0, b1, b2, b3;
+  register int c0, c1, c2, c3;
+
+  /* Loop over columns */
+
+  for (i = 0; i < 8; i++)
+    {
+      aptr = x + i;
+      b0 = LS (*aptr, 2);
+      aptr += 8;
+      a0 = LS (*aptr, 2);
+      aptr += 8;
+      b2 = LS (*aptr, 2);
+      aptr += 8;
+      a1 = LS (*aptr, 2);
+      aptr += 8;
+      b1 = LS (*aptr, 2);
+      aptr += 8;
+      a2 = LS (*aptr, 2);
+      aptr += 8;
+      b3 = LS (*aptr, 2);
+      aptr += 8;
+      a3 = LS (*aptr, 2);
+
+      /* Split into even mode  b0 = x0  b1 = x4  b2 = x2  b3 = x6.
+         And the odd terms a0 = x1 a1 = x3 a2 = x5 a3 = x7.
+       */
+
+      c0 = MSCALE ((c7d16 * a0) - (c1d16 * a3));
+      c1 = MSCALE ((c3d16 * a2) - (c5d16 * a1));
+      c2 = MSCALE ((c3d16 * a1) + (c5d16 * a2));
+      c3 = MSCALE ((c1d16 * a0) + (c7d16 * a3));
+
+      /* First Butterfly on even terms. */
+
+      a0 = MSCALE (c1d4 * (b0 + b1));
+      a1 = MSCALE (c1d4 * (b0 - b1));
+
+      a2 = MSCALE ((c3d8 * b2) - (c1d8 * b3));
+      a3 = MSCALE ((c1d8 * b2) + (c3d8 * b3));
+
+      b0 = a0 + a3;
+      b1 = a1 + a2;
+      b2 = a1 - a2;
+      b3 = a0 - a3;
+
+      /* Second Butterfly */
+
+      a0 = c0 + c1;
+      a1 = c0 - c1;
+      a2 = c3 - c2;
+      a3 = c3 + c2;
+
+      c0 = a0;
+      c1 = MSCALE (c1d4 * (a2 - a1));
+      c2 = MSCALE (c1d4 * (a2 + a1));
+      c3 = a3;
+
+      aptr = y + i;
+      *aptr = b0 + c3;
+      aptr += 8;
+      *aptr = b1 + c2;
+      aptr += 8;
+      *aptr = b2 + c1;
+      aptr += 8;
+      *aptr = b3 + c0;
+      aptr += 8;
+      *aptr = b3 - c0;
+      aptr += 8;
+      *aptr = b2 - c1;
+      aptr += 8;
+      *aptr = b1 - c2;
+      aptr += 8;
+      *aptr = b0 - c3;
+    }
+
+  /* Loop over rows */
+
+  for (i = 0; i < 8; i++)
+    {
+      aptr = y + LS (i, 3);
+      b0 = *(aptr++);
+      a0 = *(aptr++);
+      b2 = *(aptr++);
+      a1 = *(aptr++);
+      b1 = *(aptr++);
+      a2 = *(aptr++);
+      b3 = *(aptr++);
+      a3 = *(aptr);
+
+      /*
+         Split into even mode  b0 = x0  b1 = x4  b2 = x2  b3 = x6.
+         And the odd terms a0 = x1 a1 = x3 a2 = x5 a3 = x7.
+       */
+
+      c0 = MSCALE ((c7d16 * a0) - (c1d16 * a3));
+      c1 = MSCALE ((c3d16 * a2) - (c5d16 * a1));
+      c2 = MSCALE ((c3d16 * a1) + (c5d16 * a2));
+      c3 = MSCALE ((c1d16 * a0) + (c7d16 * a3));
+
+      /* First Butterfly on even terms. */
+
+      a0 = MSCALE (c1d4 * (b0 + b1));
+      a1 = MSCALE (c1d4 * (b0 - b1));
+
+      a2 = MSCALE ((c3d8 * b2) - (c1d8 * b3));
+      a3 = MSCALE ((c1d8 * b2) + (c3d8 * b3));
+
+      /* Calculate last set of b's */
+
+      b0 = a0 + a3;
+      b1 = a1 + a2;
+      b2 = a1 - a2;
+      b3 = a0 - a3;
+
+      /* Second Butterfly */
+
+      a0 = c0 + c1;
+      a1 = c0 - c1;
+      a2 = c3 - c2;
+      a3 = c3 + c2;
+
+      c0 = a0;
+      c1 = MSCALE (c1d4 * (a2 - a1));
+      c2 = MSCALE (c1d4 * (a2 + a1));
+      c3 = a3;
+
+      aptr = y + LS (i, 3);
+      *(aptr++) = b0 + c3;
+      *(aptr++) = b1 + c2;
+      *(aptr++) = b2 + c1;
+      *(aptr++) = b3 + c0;
+      *(aptr++) = b3 - c0;
+      *(aptr++) = b2 - c1;
+      *(aptr++) = b1 - c2;
+      *(aptr) = b0 - c3;
+    }
+
+  /*
+     Retrieve correct accuracy. We have additional factor
+     of 16 that must be removed.
+   */
+
+  for (i = 0, aptr = y; i < 64; i++, aptr++)
+    *aptr = (((*aptr < 0) ? (*aptr - 8) : (*aptr + 8)) / 16);
+}
+
+ /*END*/