Merge tag '1.0.2+2017.04.10.git.ea75cdf' into debian/unstable
tag 1.0.2+2017.04.10.git.ea75cdf from upstream/mastermaster
|
@ -1,5 +1,78 @@
|
|||
.deps
|
||||
.libs
|
||||
.dirstamp
|
||||
*.lo
|
||||
Makefile
|
||||
Makefile.in
|
||||
/autom4te.cache
|
||||
/aclocal.m4
|
||||
/compile
|
||||
/configure
|
||||
/depcomp
|
||||
/install-sh
|
||||
/missing
|
||||
include/config.h
|
||||
include/config.h.in
|
||||
include/config.h.in~
|
||||
include/stamp-h1
|
||||
|
||||
# Object files
|
||||
*.o
|
||||
*.ko
|
||||
*.obj
|
||||
*.elf
|
||||
|
||||
# Libraries
|
||||
*.lib
|
||||
*.la
|
||||
*.a
|
||||
|
||||
# Shared objects (inc. Windows DLLs)
|
||||
*.dll
|
||||
*.lo
|
||||
*.so
|
||||
*.so.*
|
||||
*.dylib
|
||||
|
||||
# Executables
|
||||
*.exe
|
||||
*.out
|
||||
*.app
|
||||
*.i*86
|
||||
*.x86_64
|
||||
*.hex
|
||||
|
||||
# Other stuff
|
||||
.deps/
|
||||
.libs/
|
||||
/config.log
|
||||
/config.status
|
||||
/libtool
|
||||
INSTALL
|
||||
config.guess
|
||||
config.sub
|
||||
ltmain.sh
|
||||
m4/libtool.m4
|
||||
m4/ltversion.m4
|
||||
m4/ltoptions.m4
|
||||
m4/ltsugar.m4
|
||||
m4/lt~obsolete.m4
|
||||
test-driver
|
||||
src/.dirstamp
|
||||
test-driver
|
||||
|
||||
examples/gf_example_1
|
||||
examples/gf_example_2
|
||||
examples/gf_example_3
|
||||
examples/gf_example_4
|
||||
examples/gf_example_5
|
||||
examples/gf_example_6
|
||||
examples/gf_example_7
|
||||
test/gf_unit
|
||||
tools/gf_add
|
||||
tools/gf_div
|
||||
tools/gf_inline_time
|
||||
tools/gf_methods
|
||||
tools/gf_mult
|
||||
tools/gf_poly
|
||||
tools/gf_time
|
||||
tools/gf_unit_w*
|
||||
tools/test-suite.log
|
||||
tools/.qemu/
|
||||
tools/test_simd*.results*
|
||||
|
|
370
INSTALL
|
@ -1,370 +0,0 @@
|
|||
Installation Instructions
|
||||
*************************
|
||||
|
||||
Copyright (C) 1994-1996, 1999-2002, 2004-2013 Free Software Foundation,
|
||||
Inc.
|
||||
|
||||
Copying and distribution of this file, with or without modification,
|
||||
are permitted in any medium without royalty provided the copyright
|
||||
notice and this notice are preserved. This file is offered as-is,
|
||||
without warranty of any kind.
|
||||
|
||||
Basic Installation
|
||||
==================
|
||||
|
||||
Briefly, the shell command `./configure && make && make install'
|
||||
should configure, build, and install this package. The following
|
||||
more-detailed instructions are generic; see the `README' file for
|
||||
instructions specific to this package. Some packages provide this
|
||||
`INSTALL' file but do not implement all of the features documented
|
||||
below. The lack of an optional feature in a given package is not
|
||||
necessarily a bug. More recommendations for GNU packages can be found
|
||||
in *note Makefile Conventions: (standards)Makefile Conventions.
|
||||
|
||||
The `configure' shell script attempts to guess correct values for
|
||||
various system-dependent variables used during compilation. It uses
|
||||
those values to create a `Makefile' in each directory of the package.
|
||||
It may also create one or more `.h' files containing system-dependent
|
||||
definitions. Finally, it creates a shell script `config.status' that
|
||||
you can run in the future to recreate the current configuration, and a
|
||||
file `config.log' containing compiler output (useful mainly for
|
||||
debugging `configure').
|
||||
|
||||
It can also use an optional file (typically called `config.cache'
|
||||
and enabled with `--cache-file=config.cache' or simply `-C') that saves
|
||||
the results of its tests to speed up reconfiguring. Caching is
|
||||
disabled by default to prevent problems with accidental use of stale
|
||||
cache files.
|
||||
|
||||
If you need to do unusual things to compile the package, please try
|
||||
to figure out how `configure' could check whether to do them, and mail
|
||||
diffs or instructions to the address given in the `README' so they can
|
||||
be considered for the next release. If you are using the cache, and at
|
||||
some point `config.cache' contains results you don't want to keep, you
|
||||
may remove or edit it.
|
||||
|
||||
The file `configure.ac' (or `configure.in') is used to create
|
||||
`configure' by a program called `autoconf'. You need `configure.ac' if
|
||||
you want to change it or regenerate `configure' using a newer version
|
||||
of `autoconf'.
|
||||
|
||||
The simplest way to compile this package is:
|
||||
|
||||
1. `cd' to the directory containing the package's source code and type
|
||||
`./configure' to configure the package for your system.
|
||||
|
||||
Running `configure' might take a while. While running, it prints
|
||||
some messages telling which features it is checking for.
|
||||
|
||||
2. Type `make' to compile the package.
|
||||
|
||||
3. Optionally, type `make check' to run any self-tests that come with
|
||||
the package, generally using the just-built uninstalled binaries.
|
||||
|
||||
4. Type `make install' to install the programs and any data files and
|
||||
documentation. When installing into a prefix owned by root, it is
|
||||
recommended that the package be configured and built as a regular
|
||||
user, and only the `make install' phase executed with root
|
||||
privileges.
|
||||
|
||||
5. Optionally, type `make installcheck' to repeat any self-tests, but
|
||||
this time using the binaries in their final installed location.
|
||||
This target does not install anything. Running this target as a
|
||||
regular user, particularly if the prior `make install' required
|
||||
root privileges, verifies that the installation completed
|
||||
correctly.
|
||||
|
||||
6. You can remove the program binaries and object files from the
|
||||
source code directory by typing `make clean'. To also remove the
|
||||
files that `configure' created (so you can compile the package for
|
||||
a different kind of computer), type `make distclean'. There is
|
||||
also a `make maintainer-clean' target, but that is intended mainly
|
||||
for the package's developers. If you use it, you may have to get
|
||||
all sorts of other programs in order to regenerate files that came
|
||||
with the distribution.
|
||||
|
||||
7. Often, you can also type `make uninstall' to remove the installed
|
||||
files again. In practice, not all packages have tested that
|
||||
uninstallation works correctly, even though it is required by the
|
||||
GNU Coding Standards.
|
||||
|
||||
8. Some packages, particularly those that use Automake, provide `make
|
||||
distcheck', which can by used by developers to test that all other
|
||||
targets like `make install' and `make uninstall' work correctly.
|
||||
This target is generally not run by end users.
|
||||
|
||||
Compilers and Options
|
||||
=====================
|
||||
|
||||
Some systems require unusual options for compilation or linking that
|
||||
the `configure' script does not know about. Run `./configure --help'
|
||||
for details on some of the pertinent environment variables.
|
||||
|
||||
You can give `configure' initial values for configuration parameters
|
||||
by setting variables in the command line or in the environment. Here
|
||||
is an example:
|
||||
|
||||
./configure CC=c99 CFLAGS=-g LIBS=-lposix
|
||||
|
||||
*Note Defining Variables::, for more details.
|
||||
|
||||
Compiling For Multiple Architectures
|
||||
====================================
|
||||
|
||||
You can compile the package for more than one kind of computer at the
|
||||
same time, by placing the object files for each architecture in their
|
||||
own directory. To do this, you can use GNU `make'. `cd' to the
|
||||
directory where you want the object files and executables to go and run
|
||||
the `configure' script. `configure' automatically checks for the
|
||||
source code in the directory that `configure' is in and in `..'. This
|
||||
is known as a "VPATH" build.
|
||||
|
||||
With a non-GNU `make', it is safer to compile the package for one
|
||||
architecture at a time in the source code directory. After you have
|
||||
installed the package for one architecture, use `make distclean' before
|
||||
reconfiguring for another architecture.
|
||||
|
||||
On MacOS X 10.5 and later systems, you can create libraries and
|
||||
executables that work on multiple system types--known as "fat" or
|
||||
"universal" binaries--by specifying multiple `-arch' options to the
|
||||
compiler but only a single `-arch' option to the preprocessor. Like
|
||||
this:
|
||||
|
||||
./configure CC="gcc -arch i386 -arch x86_64 -arch ppc -arch ppc64" \
|
||||
CXX="g++ -arch i386 -arch x86_64 -arch ppc -arch ppc64" \
|
||||
CPP="gcc -E" CXXCPP="g++ -E"
|
||||
|
||||
This is not guaranteed to produce working output in all cases, you
|
||||
may have to build one architecture at a time and combine the results
|
||||
using the `lipo' tool if you have problems.
|
||||
|
||||
Installation Names
|
||||
==================
|
||||
|
||||
By default, `make install' installs the package's commands under
|
||||
`/usr/local/bin', include files under `/usr/local/include', etc. You
|
||||
can specify an installation prefix other than `/usr/local' by giving
|
||||
`configure' the option `--prefix=PREFIX', where PREFIX must be an
|
||||
absolute file name.
|
||||
|
||||
You can specify separate installation prefixes for
|
||||
architecture-specific files and architecture-independent files. If you
|
||||
pass the option `--exec-prefix=PREFIX' to `configure', the package uses
|
||||
PREFIX as the prefix for installing programs and libraries.
|
||||
Documentation and other data files still use the regular prefix.
|
||||
|
||||
In addition, if you use an unusual directory layout you can give
|
||||
options like `--bindir=DIR' to specify different values for particular
|
||||
kinds of files. Run `configure --help' for a list of the directories
|
||||
you can set and what kinds of files go in them. In general, the
|
||||
default for these options is expressed in terms of `${prefix}', so that
|
||||
specifying just `--prefix' will affect all of the other directory
|
||||
specifications that were not explicitly provided.
|
||||
|
||||
The most portable way to affect installation locations is to pass the
|
||||
correct locations to `configure'; however, many packages provide one or
|
||||
both of the following shortcuts of passing variable assignments to the
|
||||
`make install' command line to change installation locations without
|
||||
having to reconfigure or recompile.
|
||||
|
||||
The first method involves providing an override variable for each
|
||||
affected directory. For example, `make install
|
||||
prefix=/alternate/directory' will choose an alternate location for all
|
||||
directory configuration variables that were expressed in terms of
|
||||
`${prefix}'. Any directories that were specified during `configure',
|
||||
but not in terms of `${prefix}', must each be overridden at install
|
||||
time for the entire installation to be relocated. The approach of
|
||||
makefile variable overrides for each directory variable is required by
|
||||
the GNU Coding Standards, and ideally causes no recompilation.
|
||||
However, some platforms have known limitations with the semantics of
|
||||
shared libraries that end up requiring recompilation when using this
|
||||
method, particularly noticeable in packages that use GNU Libtool.
|
||||
|
||||
The second method involves providing the `DESTDIR' variable. For
|
||||
example, `make install DESTDIR=/alternate/directory' will prepend
|
||||
`/alternate/directory' before all installation names. The approach of
|
||||
`DESTDIR' overrides is not required by the GNU Coding Standards, and
|
||||
does not work on platforms that have drive letters. On the other hand,
|
||||
it does better at avoiding recompilation issues, and works well even
|
||||
when some directory options were not specified in terms of `${prefix}'
|
||||
at `configure' time.
|
||||
|
||||
Optional Features
|
||||
=================
|
||||
|
||||
If the package supports it, you can cause programs to be installed
|
||||
with an extra prefix or suffix on their names by giving `configure' the
|
||||
option `--program-prefix=PREFIX' or `--program-suffix=SUFFIX'.
|
||||
|
||||
Some packages pay attention to `--enable-FEATURE' options to
|
||||
`configure', where FEATURE indicates an optional part of the package.
|
||||
They may also pay attention to `--with-PACKAGE' options, where PACKAGE
|
||||
is something like `gnu-as' or `x' (for the X Window System). The
|
||||
`README' should mention any `--enable-' and `--with-' options that the
|
||||
package recognizes.
|
||||
|
||||
For packages that use the X Window System, `configure' can usually
|
||||
find the X include and library files automatically, but if it doesn't,
|
||||
you can use the `configure' options `--x-includes=DIR' and
|
||||
`--x-libraries=DIR' to specify their locations.
|
||||
|
||||
Some packages offer the ability to configure how verbose the
|
||||
execution of `make' will be. For these packages, running `./configure
|
||||
--enable-silent-rules' sets the default to minimal output, which can be
|
||||
overridden with `make V=1'; while running `./configure
|
||||
--disable-silent-rules' sets the default to verbose, which can be
|
||||
overridden with `make V=0'.
|
||||
|
||||
Particular systems
|
||||
==================
|
||||
|
||||
On HP-UX, the default C compiler is not ANSI C compatible. If GNU
|
||||
CC is not installed, it is recommended to use the following options in
|
||||
order to use an ANSI C compiler:
|
||||
|
||||
./configure CC="cc -Ae -D_XOPEN_SOURCE=500"
|
||||
|
||||
and if that doesn't work, install pre-built binaries of GCC for HP-UX.
|
||||
|
||||
HP-UX `make' updates targets which have the same time stamps as
|
||||
their prerequisites, which makes it generally unusable when shipped
|
||||
generated files such as `configure' are involved. Use GNU `make'
|
||||
instead.
|
||||
|
||||
On OSF/1 a.k.a. Tru64, some versions of the default C compiler cannot
|
||||
parse its `<wchar.h>' header file. The option `-nodtk' can be used as
|
||||
a workaround. If GNU CC is not installed, it is therefore recommended
|
||||
to try
|
||||
|
||||
./configure CC="cc"
|
||||
|
||||
and if that doesn't work, try
|
||||
|
||||
./configure CC="cc -nodtk"
|
||||
|
||||
On Solaris, don't put `/usr/ucb' early in your `PATH'. This
|
||||
directory contains several dysfunctional programs; working variants of
|
||||
these programs are available in `/usr/bin'. So, if you need `/usr/ucb'
|
||||
in your `PATH', put it _after_ `/usr/bin'.
|
||||
|
||||
On Haiku, software installed for all users goes in `/boot/common',
|
||||
not `/usr/local'. It is recommended to use the following options:
|
||||
|
||||
./configure --prefix=/boot/common
|
||||
|
||||
Specifying the System Type
|
||||
==========================
|
||||
|
||||
There may be some features `configure' cannot figure out
|
||||
automatically, but needs to determine by the type of machine the package
|
||||
will run on. Usually, assuming the package is built to be run on the
|
||||
_same_ architectures, `configure' can figure that out, but if it prints
|
||||
a message saying it cannot guess the machine type, give it the
|
||||
`--build=TYPE' option. TYPE can either be a short name for the system
|
||||
type, such as `sun4', or a canonical name which has the form:
|
||||
|
||||
CPU-COMPANY-SYSTEM
|
||||
|
||||
where SYSTEM can have one of these forms:
|
||||
|
||||
OS
|
||||
KERNEL-OS
|
||||
|
||||
See the file `config.sub' for the possible values of each field. If
|
||||
`config.sub' isn't included in this package, then this package doesn't
|
||||
need to know the machine type.
|
||||
|
||||
If you are _building_ compiler tools for cross-compiling, you should
|
||||
use the option `--target=TYPE' to select the type of system they will
|
||||
produce code for.
|
||||
|
||||
If you want to _use_ a cross compiler, that generates code for a
|
||||
platform different from the build platform, you should specify the
|
||||
"host" platform (i.e., that on which the generated programs will
|
||||
eventually be run) with `--host=TYPE'.
|
||||
|
||||
Sharing Defaults
|
||||
================
|
||||
|
||||
If you want to set default values for `configure' scripts to share,
|
||||
you can create a site shell script called `config.site' that gives
|
||||
default values for variables like `CC', `cache_file', and `prefix'.
|
||||
`configure' looks for `PREFIX/share/config.site' if it exists, then
|
||||
`PREFIX/etc/config.site' if it exists. Or, you can set the
|
||||
`CONFIG_SITE' environment variable to the location of the site script.
|
||||
A warning: not all `configure' scripts look for a site script.
|
||||
|
||||
Defining Variables
|
||||
==================
|
||||
|
||||
Variables not defined in a site shell script can be set in the
|
||||
environment passed to `configure'. However, some packages may run
|
||||
configure again during the build, and the customized values of these
|
||||
variables may be lost. In order to avoid this problem, you should set
|
||||
them in the `configure' command line, using `VAR=value'. For example:
|
||||
|
||||
./configure CC=/usr/local2/bin/gcc
|
||||
|
||||
causes the specified `gcc' to be used as the C compiler (unless it is
|
||||
overridden in the site shell script).
|
||||
|
||||
Unfortunately, this technique does not work for `CONFIG_SHELL' due to
|
||||
an Autoconf limitation. Until the limitation is lifted, you can use
|
||||
this workaround:
|
||||
|
||||
CONFIG_SHELL=/bin/bash ./configure CONFIG_SHELL=/bin/bash
|
||||
|
||||
`configure' Invocation
|
||||
======================
|
||||
|
||||
`configure' recognizes the following options to control how it
|
||||
operates.
|
||||
|
||||
`--help'
|
||||
`-h'
|
||||
Print a summary of all of the options to `configure', and exit.
|
||||
|
||||
`--help=short'
|
||||
`--help=recursive'
|
||||
Print a summary of the options unique to this package's
|
||||
`configure', and exit. The `short' variant lists options used
|
||||
only in the top level, while the `recursive' variant lists options
|
||||
also present in any nested packages.
|
||||
|
||||
`--version'
|
||||
`-V'
|
||||
Print the version of Autoconf used to generate the `configure'
|
||||
script, and exit.
|
||||
|
||||
`--cache-file=FILE'
|
||||
Enable the cache: use and save the results of the tests in FILE,
|
||||
traditionally `config.cache'. FILE defaults to `/dev/null' to
|
||||
disable caching.
|
||||
|
||||
`--config-cache'
|
||||
`-C'
|
||||
Alias for `--cache-file=config.cache'.
|
||||
|
||||
`--quiet'
|
||||
`--silent'
|
||||
`-q'
|
||||
Do not print messages saying which checks are being made. To
|
||||
suppress all normal output, redirect it to `/dev/null' (any error
|
||||
messages will still be shown).
|
||||
|
||||
`--srcdir=DIR'
|
||||
Look for the package's source code in directory DIR. Usually
|
||||
`configure' can determine that directory automatically.
|
||||
|
||||
`--prefix=DIR'
|
||||
Use DIR as the installation prefix. *note Installation Names::
|
||||
for more details, including other options available for fine-tuning
|
||||
the installation locations.
|
||||
|
||||
`--no-create'
|
||||
`-n'
|
||||
Run the configure checks, but stop before creating any output
|
||||
files.
|
||||
|
||||
`configure' also accepts some other, not widely useful, options. Run
|
||||
`configure --help' for more details.
|
|
@ -6,3 +6,5 @@ ACLOCAL_AMFLAGS = -I m4
|
|||
|
||||
include_HEADERS = include/gf_complete.h include/gf_method.h include/gf_rand.h include/gf_general.h
|
||||
|
||||
# display the output of failed TESTS after a failed make check
|
||||
export VERBOSE = true
|
||||
|
|
859
Makefile.in
|
@ -1,859 +0,0 @@
|
|||
# Makefile.in generated by automake 1.14.1 from Makefile.am.
|
||||
# @configure_input@
|
||||
|
||||
# Copyright (C) 1994-2013 Free Software Foundation, Inc.
|
||||
|
||||
# This Makefile.in is free software; the Free Software Foundation
|
||||
# gives unlimited permission to copy and/or distribute it,
|
||||
# with or without modifications, as long as this notice is preserved.
|
||||
|
||||
# This program is distributed in the hope that it will be useful,
|
||||
# but WITHOUT ANY WARRANTY, to the extent permitted by law; without
|
||||
# even the implied warranty of MERCHANTABILITY or FITNESS FOR A
|
||||
# PARTICULAR PURPOSE.
|
||||
|
||||
@SET_MAKE@
|
||||
|
||||
# Top-level GF-Complete AM file
|
||||
# Distributes headers
|
||||
|
||||
VPATH = @srcdir@
|
||||
am__is_gnu_make = test -n '$(MAKEFILE_LIST)' && test -n '$(MAKELEVEL)'
|
||||
am__make_running_with_option = \
|
||||
case $${target_option-} in \
|
||||
?) ;; \
|
||||
*) echo "am__make_running_with_option: internal error: invalid" \
|
||||
"target option '$${target_option-}' specified" >&2; \
|
||||
exit 1;; \
|
||||
esac; \
|
||||
has_opt=no; \
|
||||
sane_makeflags=$$MAKEFLAGS; \
|
||||
if $(am__is_gnu_make); then \
|
||||
sane_makeflags=$$MFLAGS; \
|
||||
else \
|
||||
case $$MAKEFLAGS in \
|
||||
*\\[\ \ ]*) \
|
||||
bs=\\; \
|
||||
sane_makeflags=`printf '%s\n' "$$MAKEFLAGS" \
|
||||
| sed "s/$$bs$$bs[$$bs $$bs ]*//g"`;; \
|
||||
esac; \
|
||||
fi; \
|
||||
skip_next=no; \
|
||||
strip_trailopt () \
|
||||
{ \
|
||||
flg=`printf '%s\n' "$$flg" | sed "s/$$1.*$$//"`; \
|
||||
}; \
|
||||
for flg in $$sane_makeflags; do \
|
||||
test $$skip_next = yes && { skip_next=no; continue; }; \
|
||||
case $$flg in \
|
||||
*=*|--*) continue;; \
|
||||
-*I) strip_trailopt 'I'; skip_next=yes;; \
|
||||
-*I?*) strip_trailopt 'I';; \
|
||||
-*O) strip_trailopt 'O'; skip_next=yes;; \
|
||||
-*O?*) strip_trailopt 'O';; \
|
||||
-*l) strip_trailopt 'l'; skip_next=yes;; \
|
||||
-*l?*) strip_trailopt 'l';; \
|
||||
-[dEDm]) skip_next=yes;; \
|
||||
-[JT]) skip_next=yes;; \
|
||||
esac; \
|
||||
case $$flg in \
|
||||
*$$target_option*) has_opt=yes; break;; \
|
||||
esac; \
|
||||
done; \
|
||||
test $$has_opt = yes
|
||||
am__make_dryrun = (target_option=n; $(am__make_running_with_option))
|
||||
am__make_keepgoing = (target_option=k; $(am__make_running_with_option))
|
||||
pkgdatadir = $(datadir)/@PACKAGE@
|
||||
pkgincludedir = $(includedir)/@PACKAGE@
|
||||
pkglibdir = $(libdir)/@PACKAGE@
|
||||
pkglibexecdir = $(libexecdir)/@PACKAGE@
|
||||
am__cd = CDPATH="$${ZSH_VERSION+.}$(PATH_SEPARATOR)" && cd
|
||||
install_sh_DATA = $(install_sh) -c -m 644
|
||||
install_sh_PROGRAM = $(install_sh) -c
|
||||
install_sh_SCRIPT = $(install_sh) -c
|
||||
INSTALL_HEADER = $(INSTALL_DATA)
|
||||
transform = $(program_transform_name)
|
||||
NORMAL_INSTALL = :
|
||||
PRE_INSTALL = :
|
||||
POST_INSTALL = :
|
||||
NORMAL_UNINSTALL = :
|
||||
PRE_UNINSTALL = :
|
||||
POST_UNINSTALL = :
|
||||
build_triplet = @build@
|
||||
host_triplet = @host@
|
||||
subdir = .
|
||||
DIST_COMMON = INSTALL NEWS README AUTHORS ChangeLog \
|
||||
$(srcdir)/Makefile.in $(srcdir)/Makefile.am \
|
||||
$(top_srcdir)/configure $(am__configure_deps) \
|
||||
$(top_srcdir)/include/config.h.in $(include_HEADERS) COPYING \
|
||||
compile config.guess config.sub install-sh missing ltmain.sh
|
||||
ACLOCAL_M4 = $(top_srcdir)/aclocal.m4
|
||||
am__aclocal_m4_deps = $(top_srcdir)/m4/ax_check_compile_flag.m4 \
|
||||
$(top_srcdir)/m4/ax_ext.m4 \
|
||||
$(top_srcdir)/m4/ax_gcc_x86_avx_xgetbv.m4 \
|
||||
$(top_srcdir)/m4/ax_gcc_x86_cpuid.m4 \
|
||||
$(top_srcdir)/m4/libtool.m4 $(top_srcdir)/m4/ltoptions.m4 \
|
||||
$(top_srcdir)/m4/ltsugar.m4 $(top_srcdir)/m4/ltversion.m4 \
|
||||
$(top_srcdir)/m4/lt~obsolete.m4 $(top_srcdir)/configure.ac
|
||||
am__configure_deps = $(am__aclocal_m4_deps) $(CONFIGURE_DEPENDENCIES) \
|
||||
$(ACLOCAL_M4)
|
||||
am__CONFIG_DISTCLEAN_FILES = config.status config.cache config.log \
|
||||
configure.lineno config.status.lineno
|
||||
mkinstalldirs = $(install_sh) -d
|
||||
CONFIG_HEADER = $(top_builddir)/include/config.h
|
||||
CONFIG_CLEAN_FILES =
|
||||
CONFIG_CLEAN_VPATH_FILES =
|
||||
AM_V_P = $(am__v_P_@AM_V@)
|
||||
am__v_P_ = $(am__v_P_@AM_DEFAULT_V@)
|
||||
am__v_P_0 = false
|
||||
am__v_P_1 = :
|
||||
AM_V_GEN = $(am__v_GEN_@AM_V@)
|
||||
am__v_GEN_ = $(am__v_GEN_@AM_DEFAULT_V@)
|
||||
am__v_GEN_0 = @echo " GEN " $@;
|
||||
am__v_GEN_1 =
|
||||
AM_V_at = $(am__v_at_@AM_V@)
|
||||
am__v_at_ = $(am__v_at_@AM_DEFAULT_V@)
|
||||
am__v_at_0 = @
|
||||
am__v_at_1 =
|
||||
SOURCES =
|
||||
DIST_SOURCES =
|
||||
RECURSIVE_TARGETS = all-recursive check-recursive cscopelist-recursive \
|
||||
ctags-recursive dvi-recursive html-recursive info-recursive \
|
||||
install-data-recursive install-dvi-recursive \
|
||||
install-exec-recursive install-html-recursive \
|
||||
install-info-recursive install-pdf-recursive \
|
||||
install-ps-recursive install-recursive installcheck-recursive \
|
||||
installdirs-recursive pdf-recursive ps-recursive \
|
||||
tags-recursive uninstall-recursive
|
||||
am__can_run_installinfo = \
|
||||
case $$AM_UPDATE_INFO_DIR in \
|
||||
n|no|NO) false;; \
|
||||
*) (install-info --version) >/dev/null 2>&1;; \
|
||||
esac
|
||||
am__vpath_adj_setup = srcdirstrip=`echo "$(srcdir)" | sed 's|.|.|g'`;
|
||||
am__vpath_adj = case $$p in \
|
||||
$(srcdir)/*) f=`echo "$$p" | sed "s|^$$srcdirstrip/||"`;; \
|
||||
*) f=$$p;; \
|
||||
esac;
|
||||
am__strip_dir = f=`echo $$p | sed -e 's|^.*/||'`;
|
||||
am__install_max = 40
|
||||
am__nobase_strip_setup = \
|
||||
srcdirstrip=`echo "$(srcdir)" | sed 's/[].[^$$\\*|]/\\\\&/g'`
|
||||
am__nobase_strip = \
|
||||
for p in $$list; do echo "$$p"; done | sed -e "s|$$srcdirstrip/||"
|
||||
am__nobase_list = $(am__nobase_strip_setup); \
|
||||
for p in $$list; do echo "$$p $$p"; done | \
|
||||
sed "s| $$srcdirstrip/| |;"' / .*\//!s/ .*/ ./; s,\( .*\)/[^/]*$$,\1,' | \
|
||||
$(AWK) 'BEGIN { files["."] = "" } { files[$$2] = files[$$2] " " $$1; \
|
||||
if (++n[$$2] == $(am__install_max)) \
|
||||
{ print $$2, files[$$2]; n[$$2] = 0; files[$$2] = "" } } \
|
||||
END { for (dir in files) print dir, files[dir] }'
|
||||
am__base_list = \
|
||||
sed '$$!N;$$!N;$$!N;$$!N;$$!N;$$!N;$$!N;s/\n/ /g' | \
|
||||
sed '$$!N;$$!N;$$!N;$$!N;s/\n/ /g'
|
||||
am__uninstall_files_from_dir = { \
|
||||
test -z "$$files" \
|
||||
|| { test ! -d "$$dir" && test ! -f "$$dir" && test ! -r "$$dir"; } \
|
||||
|| { echo " ( cd '$$dir' && rm -f" $$files ")"; \
|
||||
$(am__cd) "$$dir" && rm -f $$files; }; \
|
||||
}
|
||||
am__installdirs = "$(DESTDIR)$(includedir)"
|
||||
HEADERS = $(include_HEADERS)
|
||||
RECURSIVE_CLEAN_TARGETS = mostlyclean-recursive clean-recursive \
|
||||
distclean-recursive maintainer-clean-recursive
|
||||
am__recursive_targets = \
|
||||
$(RECURSIVE_TARGETS) \
|
||||
$(RECURSIVE_CLEAN_TARGETS) \
|
||||
$(am__extra_recursive_targets)
|
||||
AM_RECURSIVE_TARGETS = $(am__recursive_targets:-recursive=) TAGS CTAGS \
|
||||
cscope distdir dist dist-all distcheck
|
||||
am__tagged_files = $(HEADERS) $(SOURCES) $(TAGS_FILES) $(LISP)
|
||||
# Read a list of newline-separated strings from the standard input,
|
||||
# and print each of them once, without duplicates. Input order is
|
||||
# *not* preserved.
|
||||
am__uniquify_input = $(AWK) '\
|
||||
BEGIN { nonempty = 0; } \
|
||||
{ items[$$0] = 1; nonempty = 1; } \
|
||||
END { if (nonempty) { for (i in items) print i; }; } \
|
||||
'
|
||||
# Make sure the list of sources is unique. This is necessary because,
|
||||
# e.g., the same source file might be shared among _SOURCES variables
|
||||
# for different programs/libraries.
|
||||
am__define_uniq_tagged_files = \
|
||||
list='$(am__tagged_files)'; \
|
||||
unique=`for i in $$list; do \
|
||||
if test -f "$$i"; then echo $$i; else echo $(srcdir)/$$i; fi; \
|
||||
done | $(am__uniquify_input)`
|
||||
ETAGS = etags
|
||||
CTAGS = ctags
|
||||
CSCOPE = cscope
|
||||
DIST_SUBDIRS = $(SUBDIRS)
|
||||
DISTFILES = $(DIST_COMMON) $(DIST_SOURCES) $(TEXINFOS) $(EXTRA_DIST)
|
||||
distdir = $(PACKAGE)-$(VERSION)
|
||||
top_distdir = $(distdir)
|
||||
am__remove_distdir = \
|
||||
if test -d "$(distdir)"; then \
|
||||
find "$(distdir)" -type d ! -perm -200 -exec chmod u+w {} ';' \
|
||||
&& rm -rf "$(distdir)" \
|
||||
|| { sleep 5 && rm -rf "$(distdir)"; }; \
|
||||
else :; fi
|
||||
am__post_remove_distdir = $(am__remove_distdir)
|
||||
am__relativize = \
|
||||
dir0=`pwd`; \
|
||||
sed_first='s,^\([^/]*\)/.*$$,\1,'; \
|
||||
sed_rest='s,^[^/]*/*,,'; \
|
||||
sed_last='s,^.*/\([^/]*\)$$,\1,'; \
|
||||
sed_butlast='s,/*[^/]*$$,,'; \
|
||||
while test -n "$$dir1"; do \
|
||||
first=`echo "$$dir1" | sed -e "$$sed_first"`; \
|
||||
if test "$$first" != "."; then \
|
||||
if test "$$first" = ".."; then \
|
||||
dir2=`echo "$$dir0" | sed -e "$$sed_last"`/"$$dir2"; \
|
||||
dir0=`echo "$$dir0" | sed -e "$$sed_butlast"`; \
|
||||
else \
|
||||
first2=`echo "$$dir2" | sed -e "$$sed_first"`; \
|
||||
if test "$$first2" = "$$first"; then \
|
||||
dir2=`echo "$$dir2" | sed -e "$$sed_rest"`; \
|
||||
else \
|
||||
dir2="../$$dir2"; \
|
||||
fi; \
|
||||
dir0="$$dir0"/"$$first"; \
|
||||
fi; \
|
||||
fi; \
|
||||
dir1=`echo "$$dir1" | sed -e "$$sed_rest"`; \
|
||||
done; \
|
||||
reldir="$$dir2"
|
||||
DIST_ARCHIVES = $(distdir).tar.gz
|
||||
GZIP_ENV = --best
|
||||
DIST_TARGETS = dist-gzip
|
||||
distuninstallcheck_listfiles = find . -type f -print
|
||||
am__distuninstallcheck_listfiles = $(distuninstallcheck_listfiles) \
|
||||
| sed 's|^\./|$(prefix)/|' | grep -v '$(infodir)/dir$$'
|
||||
distcleancheck_listfiles = find . -type f -print
|
||||
ACLOCAL = @ACLOCAL@
|
||||
AMTAR = @AMTAR@
|
||||
AM_DEFAULT_VERBOSITY = @AM_DEFAULT_VERBOSITY@
|
||||
AR = @AR@
|
||||
AUTOCONF = @AUTOCONF@
|
||||
AUTOHEADER = @AUTOHEADER@
|
||||
AUTOMAKE = @AUTOMAKE@
|
||||
AWK = @AWK@
|
||||
CC = @CC@
|
||||
CCDEPMODE = @CCDEPMODE@
|
||||
CFLAGS = @CFLAGS@
|
||||
CPP = @CPP@
|
||||
CPPFLAGS = @CPPFLAGS@
|
||||
CYGPATH_W = @CYGPATH_W@
|
||||
DEFS = @DEFS@
|
||||
DEPDIR = @DEPDIR@
|
||||
DLLTOOL = @DLLTOOL@
|
||||
DSYMUTIL = @DSYMUTIL@
|
||||
DUMPBIN = @DUMPBIN@
|
||||
ECHO_C = @ECHO_C@
|
||||
ECHO_N = @ECHO_N@
|
||||
ECHO_T = @ECHO_T@
|
||||
EGREP = @EGREP@
|
||||
EXEEXT = @EXEEXT@
|
||||
FGREP = @FGREP@
|
||||
GREP = @GREP@
|
||||
INSTALL = @INSTALL@
|
||||
INSTALL_DATA = @INSTALL_DATA@
|
||||
INSTALL_PROGRAM = @INSTALL_PROGRAM@
|
||||
INSTALL_SCRIPT = @INSTALL_SCRIPT@
|
||||
INSTALL_STRIP_PROGRAM = @INSTALL_STRIP_PROGRAM@
|
||||
LD = @LD@
|
||||
LDFLAGS = @LDFLAGS@
|
||||
LIBOBJS = @LIBOBJS@
|
||||
LIBS = @LIBS@
|
||||
LIBTOOL = @LIBTOOL@
|
||||
LIPO = @LIPO@
|
||||
LN_S = @LN_S@
|
||||
LTLIBOBJS = @LTLIBOBJS@
|
||||
MAINT = @MAINT@
|
||||
MAKEINFO = @MAKEINFO@
|
||||
MANIFEST_TOOL = @MANIFEST_TOOL@
|
||||
MKDIR_P = @MKDIR_P@
|
||||
NM = @NM@
|
||||
NMEDIT = @NMEDIT@
|
||||
OBJDUMP = @OBJDUMP@
|
||||
OBJEXT = @OBJEXT@
|
||||
OTOOL = @OTOOL@
|
||||
OTOOL64 = @OTOOL64@
|
||||
PACKAGE = @PACKAGE@
|
||||
PACKAGE_BUGREPORT = @PACKAGE_BUGREPORT@
|
||||
PACKAGE_NAME = @PACKAGE_NAME@
|
||||
PACKAGE_STRING = @PACKAGE_STRING@
|
||||
PACKAGE_TARNAME = @PACKAGE_TARNAME@
|
||||
PACKAGE_URL = @PACKAGE_URL@
|
||||
PACKAGE_VERSION = @PACKAGE_VERSION@
|
||||
PATH_SEPARATOR = @PATH_SEPARATOR@
|
||||
RANLIB = @RANLIB@
|
||||
SED = @SED@
|
||||
SET_MAKE = @SET_MAKE@
|
||||
SHELL = @SHELL@
|
||||
SIMD_FLAGS = @SIMD_FLAGS@
|
||||
STRIP = @STRIP@
|
||||
VERSION = @VERSION@
|
||||
abs_builddir = @abs_builddir@
|
||||
abs_srcdir = @abs_srcdir@
|
||||
abs_top_builddir = @abs_top_builddir@
|
||||
abs_top_srcdir = @abs_top_srcdir@
|
||||
ac_ct_AR = @ac_ct_AR@
|
||||
ac_ct_CC = @ac_ct_CC@
|
||||
ac_ct_DUMPBIN = @ac_ct_DUMPBIN@
|
||||
am__include = @am__include@
|
||||
am__leading_dot = @am__leading_dot@
|
||||
am__quote = @am__quote@
|
||||
am__tar = @am__tar@
|
||||
am__untar = @am__untar@
|
||||
bindir = @bindir@
|
||||
build = @build@
|
||||
build_alias = @build_alias@
|
||||
build_cpu = @build_cpu@
|
||||
build_os = @build_os@
|
||||
build_vendor = @build_vendor@
|
||||
builddir = @builddir@
|
||||
datadir = @datadir@
|
||||
datarootdir = @datarootdir@
|
||||
docdir = @docdir@
|
||||
dvidir = @dvidir@
|
||||
exec_prefix = @exec_prefix@
|
||||
host = @host@
|
||||
host_alias = @host_alias@
|
||||
host_cpu = @host_cpu@
|
||||
host_os = @host_os@
|
||||
host_vendor = @host_vendor@
|
||||
htmldir = @htmldir@
|
||||
includedir = @includedir@
|
||||
infodir = @infodir@
|
||||
install_sh = @install_sh@
|
||||
libdir = @libdir@
|
||||
libexecdir = @libexecdir@
|
||||
localedir = @localedir@
|
||||
localstatedir = @localstatedir@
|
||||
mandir = @mandir@
|
||||
mkdir_p = @mkdir_p@
|
||||
oldincludedir = @oldincludedir@
|
||||
pdfdir = @pdfdir@
|
||||
prefix = @prefix@
|
||||
program_transform_name = @program_transform_name@
|
||||
psdir = @psdir@
|
||||
sbindir = @sbindir@
|
||||
sharedstatedir = @sharedstatedir@
|
||||
srcdir = @srcdir@
|
||||
sysconfdir = @sysconfdir@
|
||||
target_alias = @target_alias@
|
||||
top_build_prefix = @top_build_prefix@
|
||||
top_builddir = @top_builddir@
|
||||
top_srcdir = @top_srcdir@
|
||||
SUBDIRS = src tools test examples
|
||||
ACLOCAL_AMFLAGS = -I m4
|
||||
include_HEADERS = include/gf_complete.h include/gf_method.h include/gf_rand.h include/gf_general.h
|
||||
all: all-recursive
|
||||
|
||||
.SUFFIXES:
|
||||
am--refresh: Makefile
|
||||
@:
|
||||
$(srcdir)/Makefile.in: @MAINTAINER_MODE_TRUE@ $(srcdir)/Makefile.am $(am__configure_deps)
|
||||
@for dep in $?; do \
|
||||
case '$(am__configure_deps)' in \
|
||||
*$$dep*) \
|
||||
echo ' cd $(srcdir) && $(AUTOMAKE) --gnu'; \
|
||||
$(am__cd) $(srcdir) && $(AUTOMAKE) --gnu \
|
||||
&& exit 0; \
|
||||
exit 1;; \
|
||||
esac; \
|
||||
done; \
|
||||
echo ' cd $(top_srcdir) && $(AUTOMAKE) --gnu Makefile'; \
|
||||
$(am__cd) $(top_srcdir) && \
|
||||
$(AUTOMAKE) --gnu Makefile
|
||||
.PRECIOUS: Makefile
|
||||
Makefile: $(srcdir)/Makefile.in $(top_builddir)/config.status
|
||||
@case '$?' in \
|
||||
*config.status*) \
|
||||
echo ' $(SHELL) ./config.status'; \
|
||||
$(SHELL) ./config.status;; \
|
||||
*) \
|
||||
echo ' cd $(top_builddir) && $(SHELL) ./config.status $@ $(am__depfiles_maybe)'; \
|
||||
cd $(top_builddir) && $(SHELL) ./config.status $@ $(am__depfiles_maybe);; \
|
||||
esac;
|
||||
|
||||
$(top_builddir)/config.status: $(top_srcdir)/configure $(CONFIG_STATUS_DEPENDENCIES)
|
||||
$(SHELL) ./config.status --recheck
|
||||
|
||||
$(top_srcdir)/configure: @MAINTAINER_MODE_TRUE@ $(am__configure_deps)
|
||||
$(am__cd) $(srcdir) && $(AUTOCONF)
|
||||
$(ACLOCAL_M4): @MAINTAINER_MODE_TRUE@ $(am__aclocal_m4_deps)
|
||||
$(am__cd) $(srcdir) && $(ACLOCAL) $(ACLOCAL_AMFLAGS)
|
||||
$(am__aclocal_m4_deps):
|
||||
|
||||
include/config.h: include/stamp-h1
|
||||
@test -f $@ || rm -f include/stamp-h1
|
||||
@test -f $@ || $(MAKE) $(AM_MAKEFLAGS) include/stamp-h1
|
||||
|
||||
include/stamp-h1: $(top_srcdir)/include/config.h.in $(top_builddir)/config.status
|
||||
@rm -f include/stamp-h1
|
||||
cd $(top_builddir) && $(SHELL) ./config.status include/config.h
|
||||
$(top_srcdir)/include/config.h.in: @MAINTAINER_MODE_TRUE@ $(am__configure_deps)
|
||||
($(am__cd) $(top_srcdir) && $(AUTOHEADER))
|
||||
rm -f include/stamp-h1
|
||||
touch $@
|
||||
|
||||
distclean-hdr:
|
||||
-rm -f include/config.h include/stamp-h1
|
||||
|
||||
mostlyclean-libtool:
|
||||
-rm -f *.lo
|
||||
|
||||
clean-libtool:
|
||||
-rm -rf .libs _libs
|
||||
|
||||
distclean-libtool:
|
||||
-rm -f libtool config.lt
|
||||
install-includeHEADERS: $(include_HEADERS)
|
||||
@$(NORMAL_INSTALL)
|
||||
@list='$(include_HEADERS)'; test -n "$(includedir)" || list=; \
|
||||
if test -n "$$list"; then \
|
||||
echo " $(MKDIR_P) '$(DESTDIR)$(includedir)'"; \
|
||||
$(MKDIR_P) "$(DESTDIR)$(includedir)" || exit 1; \
|
||||
fi; \
|
||||
for p in $$list; do \
|
||||
if test -f "$$p"; then d=; else d="$(srcdir)/"; fi; \
|
||||
echo "$$d$$p"; \
|
||||
done | $(am__base_list) | \
|
||||
while read files; do \
|
||||
echo " $(INSTALL_HEADER) $$files '$(DESTDIR)$(includedir)'"; \
|
||||
$(INSTALL_HEADER) $$files "$(DESTDIR)$(includedir)" || exit $$?; \
|
||||
done
|
||||
|
||||
uninstall-includeHEADERS:
|
||||
@$(NORMAL_UNINSTALL)
|
||||
@list='$(include_HEADERS)'; test -n "$(includedir)" || list=; \
|
||||
files=`for p in $$list; do echo $$p; done | sed -e 's|^.*/||'`; \
|
||||
dir='$(DESTDIR)$(includedir)'; $(am__uninstall_files_from_dir)
|
||||
|
||||
# This directory's subdirectories are mostly independent; you can cd
|
||||
# into them and run 'make' without going through this Makefile.
|
||||
# To change the values of 'make' variables: instead of editing Makefiles,
|
||||
# (1) if the variable is set in 'config.status', edit 'config.status'
|
||||
# (which will cause the Makefiles to be regenerated when you run 'make');
|
||||
# (2) otherwise, pass the desired values on the 'make' command line.
|
||||
$(am__recursive_targets):
|
||||
@fail=; \
|
||||
if $(am__make_keepgoing); then \
|
||||
failcom='fail=yes'; \
|
||||
else \
|
||||
failcom='exit 1'; \
|
||||
fi; \
|
||||
dot_seen=no; \
|
||||
target=`echo $@ | sed s/-recursive//`; \
|
||||
case "$@" in \
|
||||
distclean-* | maintainer-clean-*) list='$(DIST_SUBDIRS)' ;; \
|
||||
*) list='$(SUBDIRS)' ;; \
|
||||
esac; \
|
||||
for subdir in $$list; do \
|
||||
echo "Making $$target in $$subdir"; \
|
||||
if test "$$subdir" = "."; then \
|
||||
dot_seen=yes; \
|
||||
local_target="$$target-am"; \
|
||||
else \
|
||||
local_target="$$target"; \
|
||||
fi; \
|
||||
($(am__cd) $$subdir && $(MAKE) $(AM_MAKEFLAGS) $$local_target) \
|
||||
|| eval $$failcom; \
|
||||
done; \
|
||||
if test "$$dot_seen" = "no"; then \
|
||||
$(MAKE) $(AM_MAKEFLAGS) "$$target-am" || exit 1; \
|
||||
fi; test -z "$$fail"
|
||||
|
||||
ID: $(am__tagged_files)
|
||||
$(am__define_uniq_tagged_files); mkid -fID $$unique
|
||||
tags: tags-recursive
|
||||
TAGS: tags
|
||||
|
||||
tags-am: $(TAGS_DEPENDENCIES) $(am__tagged_files)
|
||||
set x; \
|
||||
here=`pwd`; \
|
||||
if ($(ETAGS) --etags-include --version) >/dev/null 2>&1; then \
|
||||
include_option=--etags-include; \
|
||||
empty_fix=.; \
|
||||
else \
|
||||
include_option=--include; \
|
||||
empty_fix=; \
|
||||
fi; \
|
||||
list='$(SUBDIRS)'; for subdir in $$list; do \
|
||||
if test "$$subdir" = .; then :; else \
|
||||
test ! -f $$subdir/TAGS || \
|
||||
set "$$@" "$$include_option=$$here/$$subdir/TAGS"; \
|
||||
fi; \
|
||||
done; \
|
||||
$(am__define_uniq_tagged_files); \
|
||||
shift; \
|
||||
if test -z "$(ETAGS_ARGS)$$*$$unique"; then :; else \
|
||||
test -n "$$unique" || unique=$$empty_fix; \
|
||||
if test $$# -gt 0; then \
|
||||
$(ETAGS) $(ETAGSFLAGS) $(AM_ETAGSFLAGS) $(ETAGS_ARGS) \
|
||||
"$$@" $$unique; \
|
||||
else \
|
||||
$(ETAGS) $(ETAGSFLAGS) $(AM_ETAGSFLAGS) $(ETAGS_ARGS) \
|
||||
$$unique; \
|
||||
fi; \
|
||||
fi
|
||||
ctags: ctags-recursive
|
||||
|
||||
CTAGS: ctags
|
||||
ctags-am: $(TAGS_DEPENDENCIES) $(am__tagged_files)
|
||||
$(am__define_uniq_tagged_files); \
|
||||
test -z "$(CTAGS_ARGS)$$unique" \
|
||||
|| $(CTAGS) $(CTAGSFLAGS) $(AM_CTAGSFLAGS) $(CTAGS_ARGS) \
|
||||
$$unique
|
||||
|
||||
GTAGS:
|
||||
here=`$(am__cd) $(top_builddir) && pwd` \
|
||||
&& $(am__cd) $(top_srcdir) \
|
||||
&& gtags -i $(GTAGS_ARGS) "$$here"
|
||||
cscope: cscope.files
|
||||
test ! -s cscope.files \
|
||||
|| $(CSCOPE) -b -q $(AM_CSCOPEFLAGS) $(CSCOPEFLAGS) -i cscope.files $(CSCOPE_ARGS)
|
||||
clean-cscope:
|
||||
-rm -f cscope.files
|
||||
cscope.files: clean-cscope cscopelist
|
||||
cscopelist: cscopelist-recursive
|
||||
|
||||
cscopelist-am: $(am__tagged_files)
|
||||
list='$(am__tagged_files)'; \
|
||||
case "$(srcdir)" in \
|
||||
[\\/]* | ?:[\\/]*) sdir="$(srcdir)" ;; \
|
||||
*) sdir=$(subdir)/$(srcdir) ;; \
|
||||
esac; \
|
||||
for i in $$list; do \
|
||||
if test -f "$$i"; then \
|
||||
echo "$(subdir)/$$i"; \
|
||||
else \
|
||||
echo "$$sdir/$$i"; \
|
||||
fi; \
|
||||
done >> $(top_builddir)/cscope.files
|
||||
|
||||
distclean-tags:
|
||||
-rm -f TAGS ID GTAGS GRTAGS GSYMS GPATH tags
|
||||
-rm -f cscope.out cscope.in.out cscope.po.out cscope.files
|
||||
|
||||
distdir: $(DISTFILES)
|
||||
$(am__remove_distdir)
|
||||
test -d "$(distdir)" || mkdir "$(distdir)"
|
||||
@srcdirstrip=`echo "$(srcdir)" | sed 's/[].[^$$\\*]/\\\\&/g'`; \
|
||||
topsrcdirstrip=`echo "$(top_srcdir)" | sed 's/[].[^$$\\*]/\\\\&/g'`; \
|
||||
list='$(DISTFILES)'; \
|
||||
dist_files=`for file in $$list; do echo $$file; done | \
|
||||
sed -e "s|^$$srcdirstrip/||;t" \
|
||||
-e "s|^$$topsrcdirstrip/|$(top_builddir)/|;t"`; \
|
||||
case $$dist_files in \
|
||||
*/*) $(MKDIR_P) `echo "$$dist_files" | \
|
||||
sed '/\//!d;s|^|$(distdir)/|;s,/[^/]*$$,,' | \
|
||||
sort -u` ;; \
|
||||
esac; \
|
||||
for file in $$dist_files; do \
|
||||
if test -f $$file || test -d $$file; then d=.; else d=$(srcdir); fi; \
|
||||
if test -d $$d/$$file; then \
|
||||
dir=`echo "/$$file" | sed -e 's,/[^/]*$$,,'`; \
|
||||
if test -d "$(distdir)/$$file"; then \
|
||||
find "$(distdir)/$$file" -type d ! -perm -700 -exec chmod u+rwx {} \;; \
|
||||
fi; \
|
||||
if test -d $(srcdir)/$$file && test $$d != $(srcdir); then \
|
||||
cp -fpR $(srcdir)/$$file "$(distdir)$$dir" || exit 1; \
|
||||
find "$(distdir)/$$file" -type d ! -perm -700 -exec chmod u+rwx {} \;; \
|
||||
fi; \
|
||||
cp -fpR $$d/$$file "$(distdir)$$dir" || exit 1; \
|
||||
else \
|
||||
test -f "$(distdir)/$$file" \
|
||||
|| cp -p $$d/$$file "$(distdir)/$$file" \
|
||||
|| exit 1; \
|
||||
fi; \
|
||||
done
|
||||
@list='$(DIST_SUBDIRS)'; for subdir in $$list; do \
|
||||
if test "$$subdir" = .; then :; else \
|
||||
$(am__make_dryrun) \
|
||||
|| test -d "$(distdir)/$$subdir" \
|
||||
|| $(MKDIR_P) "$(distdir)/$$subdir" \
|
||||
|| exit 1; \
|
||||
dir1=$$subdir; dir2="$(distdir)/$$subdir"; \
|
||||
$(am__relativize); \
|
||||
new_distdir=$$reldir; \
|
||||
dir1=$$subdir; dir2="$(top_distdir)"; \
|
||||
$(am__relativize); \
|
||||
new_top_distdir=$$reldir; \
|
||||
echo " (cd $$subdir && $(MAKE) $(AM_MAKEFLAGS) top_distdir="$$new_top_distdir" distdir="$$new_distdir" \\"; \
|
||||
echo " am__remove_distdir=: am__skip_length_check=: am__skip_mode_fix=: distdir)"; \
|
||||
($(am__cd) $$subdir && \
|
||||
$(MAKE) $(AM_MAKEFLAGS) \
|
||||
top_distdir="$$new_top_distdir" \
|
||||
distdir="$$new_distdir" \
|
||||
am__remove_distdir=: \
|
||||
am__skip_length_check=: \
|
||||
am__skip_mode_fix=: \
|
||||
distdir) \
|
||||
|| exit 1; \
|
||||
fi; \
|
||||
done
|
||||
-test -n "$(am__skip_mode_fix)" \
|
||||
|| find "$(distdir)" -type d ! -perm -755 \
|
||||
-exec chmod u+rwx,go+rx {} \; -o \
|
||||
! -type d ! -perm -444 -links 1 -exec chmod a+r {} \; -o \
|
||||
! -type d ! -perm -400 -exec chmod a+r {} \; -o \
|
||||
! -type d ! -perm -444 -exec $(install_sh) -c -m a+r {} {} \; \
|
||||
|| chmod -R a+r "$(distdir)"
|
||||
dist-gzip: distdir
|
||||
tardir=$(distdir) && $(am__tar) | GZIP=$(GZIP_ENV) gzip -c >$(distdir).tar.gz
|
||||
$(am__post_remove_distdir)
|
||||
|
||||
dist-bzip2: distdir
|
||||
tardir=$(distdir) && $(am__tar) | BZIP2=$${BZIP2--9} bzip2 -c >$(distdir).tar.bz2
|
||||
$(am__post_remove_distdir)
|
||||
|
||||
dist-lzip: distdir
|
||||
tardir=$(distdir) && $(am__tar) | lzip -c $${LZIP_OPT--9} >$(distdir).tar.lz
|
||||
$(am__post_remove_distdir)
|
||||
|
||||
dist-xz: distdir
|
||||
tardir=$(distdir) && $(am__tar) | XZ_OPT=$${XZ_OPT--e} xz -c >$(distdir).tar.xz
|
||||
$(am__post_remove_distdir)
|
||||
|
||||
dist-tarZ: distdir
|
||||
@echo WARNING: "Support for shar distribution archives is" \
|
||||
"deprecated." >&2
|
||||
@echo WARNING: "It will be removed altogether in Automake 2.0" >&2
|
||||
tardir=$(distdir) && $(am__tar) | compress -c >$(distdir).tar.Z
|
||||
$(am__post_remove_distdir)
|
||||
|
||||
dist-shar: distdir
|
||||
@echo WARNING: "Support for distribution archives compressed with" \
|
||||
"legacy program 'compress' is deprecated." >&2
|
||||
@echo WARNING: "It will be removed altogether in Automake 2.0" >&2
|
||||
shar $(distdir) | GZIP=$(GZIP_ENV) gzip -c >$(distdir).shar.gz
|
||||
$(am__post_remove_distdir)
|
||||
|
||||
dist-zip: distdir
|
||||
-rm -f $(distdir).zip
|
||||
zip -rq $(distdir).zip $(distdir)
|
||||
$(am__post_remove_distdir)
|
||||
|
||||
dist dist-all:
|
||||
$(MAKE) $(AM_MAKEFLAGS) $(DIST_TARGETS) am__post_remove_distdir='@:'
|
||||
$(am__post_remove_distdir)
|
||||
|
||||
# This target untars the dist file and tries a VPATH configuration. Then
|
||||
# it guarantees that the distribution is self-contained by making another
|
||||
# tarfile.
|
||||
distcheck: dist
|
||||
case '$(DIST_ARCHIVES)' in \
|
||||
*.tar.gz*) \
|
||||
GZIP=$(GZIP_ENV) gzip -dc $(distdir).tar.gz | $(am__untar) ;;\
|
||||
*.tar.bz2*) \
|
||||
bzip2 -dc $(distdir).tar.bz2 | $(am__untar) ;;\
|
||||
*.tar.lz*) \
|
||||
lzip -dc $(distdir).tar.lz | $(am__untar) ;;\
|
||||
*.tar.xz*) \
|
||||
xz -dc $(distdir).tar.xz | $(am__untar) ;;\
|
||||
*.tar.Z*) \
|
||||
uncompress -c $(distdir).tar.Z | $(am__untar) ;;\
|
||||
*.shar.gz*) \
|
||||
GZIP=$(GZIP_ENV) gzip -dc $(distdir).shar.gz | unshar ;;\
|
||||
*.zip*) \
|
||||
unzip $(distdir).zip ;;\
|
||||
esac
|
||||
chmod -R a-w $(distdir)
|
||||
chmod u+w $(distdir)
|
||||
mkdir $(distdir)/_build $(distdir)/_inst
|
||||
chmod a-w $(distdir)
|
||||
test -d $(distdir)/_build || exit 0; \
|
||||
dc_install_base=`$(am__cd) $(distdir)/_inst && pwd | sed -e 's,^[^:\\/]:[\\/],/,'` \
|
||||
&& dc_destdir="$${TMPDIR-/tmp}/am-dc-$$$$/" \
|
||||
&& am__cwd=`pwd` \
|
||||
&& $(am__cd) $(distdir)/_build \
|
||||
&& ../configure \
|
||||
$(AM_DISTCHECK_CONFIGURE_FLAGS) \
|
||||
$(DISTCHECK_CONFIGURE_FLAGS) \
|
||||
--srcdir=.. --prefix="$$dc_install_base" \
|
||||
&& $(MAKE) $(AM_MAKEFLAGS) \
|
||||
&& $(MAKE) $(AM_MAKEFLAGS) dvi \
|
||||
&& $(MAKE) $(AM_MAKEFLAGS) check \
|
||||
&& $(MAKE) $(AM_MAKEFLAGS) install \
|
||||
&& $(MAKE) $(AM_MAKEFLAGS) installcheck \
|
||||
&& $(MAKE) $(AM_MAKEFLAGS) uninstall \
|
||||
&& $(MAKE) $(AM_MAKEFLAGS) distuninstallcheck_dir="$$dc_install_base" \
|
||||
distuninstallcheck \
|
||||
&& chmod -R a-w "$$dc_install_base" \
|
||||
&& ({ \
|
||||
(cd ../.. && umask 077 && mkdir "$$dc_destdir") \
|
||||
&& $(MAKE) $(AM_MAKEFLAGS) DESTDIR="$$dc_destdir" install \
|
||||
&& $(MAKE) $(AM_MAKEFLAGS) DESTDIR="$$dc_destdir" uninstall \
|
||||
&& $(MAKE) $(AM_MAKEFLAGS) DESTDIR="$$dc_destdir" \
|
||||
distuninstallcheck_dir="$$dc_destdir" distuninstallcheck; \
|
||||
} || { rm -rf "$$dc_destdir"; exit 1; }) \
|
||||
&& rm -rf "$$dc_destdir" \
|
||||
&& $(MAKE) $(AM_MAKEFLAGS) dist \
|
||||
&& rm -rf $(DIST_ARCHIVES) \
|
||||
&& $(MAKE) $(AM_MAKEFLAGS) distcleancheck \
|
||||
&& cd "$$am__cwd" \
|
||||
|| exit 1
|
||||
$(am__post_remove_distdir)
|
||||
@(echo "$(distdir) archives ready for distribution: "; \
|
||||
list='$(DIST_ARCHIVES)'; for i in $$list; do echo $$i; done) | \
|
||||
sed -e 1h -e 1s/./=/g -e 1p -e 1x -e '$$p' -e '$$x'
|
||||
distuninstallcheck:
|
||||
@test -n '$(distuninstallcheck_dir)' || { \
|
||||
echo 'ERROR: trying to run $@ with an empty' \
|
||||
'$$(distuninstallcheck_dir)' >&2; \
|
||||
exit 1; \
|
||||
}; \
|
||||
$(am__cd) '$(distuninstallcheck_dir)' || { \
|
||||
echo 'ERROR: cannot chdir into $(distuninstallcheck_dir)' >&2; \
|
||||
exit 1; \
|
||||
}; \
|
||||
test `$(am__distuninstallcheck_listfiles) | wc -l` -eq 0 \
|
||||
|| { echo "ERROR: files left after uninstall:" ; \
|
||||
if test -n "$(DESTDIR)"; then \
|
||||
echo " (check DESTDIR support)"; \
|
||||
fi ; \
|
||||
$(distuninstallcheck_listfiles) ; \
|
||||
exit 1; } >&2
|
||||
distcleancheck: distclean
|
||||
@if test '$(srcdir)' = . ; then \
|
||||
echo "ERROR: distcleancheck can only run from a VPATH build" ; \
|
||||
exit 1 ; \
|
||||
fi
|
||||
@test `$(distcleancheck_listfiles) | wc -l` -eq 0 \
|
||||
|| { echo "ERROR: files left in build directory after distclean:" ; \
|
||||
$(distcleancheck_listfiles) ; \
|
||||
exit 1; } >&2
|
||||
check-am: all-am
|
||||
check: check-recursive
|
||||
all-am: Makefile $(HEADERS)
|
||||
installdirs: installdirs-recursive
|
||||
installdirs-am:
|
||||
for dir in "$(DESTDIR)$(includedir)"; do \
|
||||
test -z "$$dir" || $(MKDIR_P) "$$dir"; \
|
||||
done
|
||||
install: install-recursive
|
||||
install-exec: install-exec-recursive
|
||||
install-data: install-data-recursive
|
||||
uninstall: uninstall-recursive
|
||||
|
||||
install-am: all-am
|
||||
@$(MAKE) $(AM_MAKEFLAGS) install-exec-am install-data-am
|
||||
|
||||
installcheck: installcheck-recursive
|
||||
install-strip:
|
||||
if test -z '$(STRIP)'; then \
|
||||
$(MAKE) $(AM_MAKEFLAGS) INSTALL_PROGRAM="$(INSTALL_STRIP_PROGRAM)" \
|
||||
install_sh_PROGRAM="$(INSTALL_STRIP_PROGRAM)" INSTALL_STRIP_FLAG=-s \
|
||||
install; \
|
||||
else \
|
||||
$(MAKE) $(AM_MAKEFLAGS) INSTALL_PROGRAM="$(INSTALL_STRIP_PROGRAM)" \
|
||||
install_sh_PROGRAM="$(INSTALL_STRIP_PROGRAM)" INSTALL_STRIP_FLAG=-s \
|
||||
"INSTALL_PROGRAM_ENV=STRIPPROG='$(STRIP)'" install; \
|
||||
fi
|
||||
mostlyclean-generic:
|
||||
|
||||
clean-generic:
|
||||
|
||||
distclean-generic:
|
||||
-test -z "$(CONFIG_CLEAN_FILES)" || rm -f $(CONFIG_CLEAN_FILES)
|
||||
-test . = "$(srcdir)" || test -z "$(CONFIG_CLEAN_VPATH_FILES)" || rm -f $(CONFIG_CLEAN_VPATH_FILES)
|
||||
|
||||
maintainer-clean-generic:
|
||||
@echo "This command is intended for maintainers to use"
|
||||
@echo "it deletes files that may require special tools to rebuild."
|
||||
clean: clean-recursive
|
||||
|
||||
clean-am: clean-generic clean-libtool mostlyclean-am
|
||||
|
||||
distclean: distclean-recursive
|
||||
-rm -f $(am__CONFIG_DISTCLEAN_FILES)
|
||||
-rm -f Makefile
|
||||
distclean-am: clean-am distclean-generic distclean-hdr \
|
||||
distclean-libtool distclean-tags
|
||||
|
||||
dvi: dvi-recursive
|
||||
|
||||
dvi-am:
|
||||
|
||||
html: html-recursive
|
||||
|
||||
html-am:
|
||||
|
||||
info: info-recursive
|
||||
|
||||
info-am:
|
||||
|
||||
install-data-am: install-includeHEADERS
|
||||
|
||||
install-dvi: install-dvi-recursive
|
||||
|
||||
install-dvi-am:
|
||||
|
||||
install-exec-am:
|
||||
|
||||
install-html: install-html-recursive
|
||||
|
||||
install-html-am:
|
||||
|
||||
install-info: install-info-recursive
|
||||
|
||||
install-info-am:
|
||||
|
||||
install-man:
|
||||
|
||||
install-pdf: install-pdf-recursive
|
||||
|
||||
install-pdf-am:
|
||||
|
||||
install-ps: install-ps-recursive
|
||||
|
||||
install-ps-am:
|
||||
|
||||
installcheck-am:
|
||||
|
||||
maintainer-clean: maintainer-clean-recursive
|
||||
-rm -f $(am__CONFIG_DISTCLEAN_FILES)
|
||||
-rm -rf $(top_srcdir)/autom4te.cache
|
||||
-rm -f Makefile
|
||||
maintainer-clean-am: distclean-am maintainer-clean-generic
|
||||
|
||||
mostlyclean: mostlyclean-recursive
|
||||
|
||||
mostlyclean-am: mostlyclean-generic mostlyclean-libtool
|
||||
|
||||
pdf: pdf-recursive
|
||||
|
||||
pdf-am:
|
||||
|
||||
ps: ps-recursive
|
||||
|
||||
ps-am:
|
||||
|
||||
uninstall-am: uninstall-includeHEADERS
|
||||
|
||||
.MAKE: $(am__recursive_targets) install-am install-strip
|
||||
|
||||
.PHONY: $(am__recursive_targets) CTAGS GTAGS TAGS all all-am \
|
||||
am--refresh check check-am clean clean-cscope clean-generic \
|
||||
clean-libtool cscope cscopelist-am ctags ctags-am dist \
|
||||
dist-all dist-bzip2 dist-gzip dist-lzip dist-shar dist-tarZ \
|
||||
dist-xz dist-zip distcheck distclean distclean-generic \
|
||||
distclean-hdr distclean-libtool distclean-tags distcleancheck \
|
||||
distdir distuninstallcheck dvi dvi-am html html-am info \
|
||||
info-am install install-am install-data install-data-am \
|
||||
install-dvi install-dvi-am install-exec install-exec-am \
|
||||
install-html install-html-am install-includeHEADERS \
|
||||
install-info install-info-am install-man install-pdf \
|
||||
install-pdf-am install-ps install-ps-am install-strip \
|
||||
installcheck installcheck-am installdirs installdirs-am \
|
||||
maintainer-clean maintainer-clean-generic mostlyclean \
|
||||
mostlyclean-generic mostlyclean-libtool pdf pdf-am ps ps-am \
|
||||
tags tags-am uninstall uninstall-am uninstall-includeHEADERS
|
||||
|
||||
|
||||
# Tell versions [3.59,3.63) of GNU make to not export all variables.
|
||||
# Otherwise a system limit (for SysV at least) may be exceeded.
|
||||
.NOEXPORT:
|
17
README
|
@ -1,4 +1,4 @@
|
|||
This is GF-Complete, Revision 1.02. January 1, 2014.
|
||||
This is GF-Complete, Revision 1.03. January 1, 2015.
|
||||
|
||||
Authors: James S. Plank (University of Tennessee)
|
||||
Ethan L. Miller (UC Santa Cruz)
|
||||
|
@ -8,25 +8,14 @@ Authors: James S. Plank (University of Tennessee)
|
|||
Adam W. Disney (University of Tennessee,
|
||||
Allen C. McBride (University of Tennessee)
|
||||
|
||||
The programmer's manual and tutorial is provided in two places:
|
||||
|
||||
1.) A copy is hosted on BitBucket at https://bitbucket.org/jimplank/gf-complete/downloads/GF-Complete-Manual.pdf
|
||||
2.) A copy is also available at http://www.cs.utk.edu/~plank/plank/papers/GF-Complete-Manual-1.02.pdf
|
||||
The user's manual is in the file Manual.pdf.
|
||||
|
||||
The online home for GF-Complete is:
|
||||
|
||||
- https://bitbucket.org/jimplank/gf-complete
|
||||
|
||||
If you want to cite GF-Complete in a paper, I suggest citing the
|
||||
technical report version. The precise citation information for that
|
||||
is in http://www.cs.utk.edu/~plank/plank/papers/CS-13-716.html.
|
||||
- https://jerasure.org/jerasure/gf-complete
|
||||
|
||||
To compile, do:
|
||||
|
||||
./configure
|
||||
make
|
||||
sudo make install
|
||||
|
||||
To run the tests, do:
|
||||
|
||||
make check
|
||||
|
|
11
README.txt
|
@ -1,4 +1,4 @@
|
|||
This is GF-Complete, Revision 1.02. January 1, 2014.
|
||||
This is GF-Complete, Revision 1.03. January 1, 2015.
|
||||
|
||||
Authors: James S. Plank (University of Tennessee)
|
||||
Ethan L. Miller (UC Santa Cruz)
|
||||
|
@ -8,16 +8,11 @@ Authors: James S. Plank (University of Tennessee)
|
|||
Adam W. Disney (University of Tennessee,
|
||||
Allen C. McBride (University of Tennessee)
|
||||
|
||||
The user's manual is in the file Manual.pdf. You may also get a copy of that
|
||||
manual at http://www.cs.utk.edu/~plank/plank/papers/GF-Complete-Manual-1.02.pdf.
|
||||
The user's manual is in the file Manual.pdf.
|
||||
|
||||
The online home for GF-Complete is:
|
||||
|
||||
- https://bitbucket.org/jimplank/gf-complete
|
||||
|
||||
If you want to cite GF-Complete in a paper, I suggest citing the
|
||||
technical report version. The precise citation information for that
|
||||
is in http://www.cs.utk.edu/~plank/plank/papers/CS-13-716.html.
|
||||
- http://jerasure.org/jerasure/gf-complete
|
||||
|
||||
To compile, do:
|
||||
|
||||
|
|
347
compile
|
@ -1,347 +0,0 @@
|
|||
#! /bin/sh
|
||||
# Wrapper for compilers which do not understand '-c -o'.
|
||||
|
||||
scriptversion=2012-10-14.11; # UTC
|
||||
|
||||
# Copyright (C) 1999-2013 Free Software Foundation, Inc.
|
||||
# Written by Tom Tromey <tromey@cygnus.com>.
|
||||
#
|
||||
# This program is free software; you can redistribute it and/or modify
|
||||
# it under the terms of the GNU General Public License as published by
|
||||
# the Free Software Foundation; either version 2, or (at your option)
|
||||
# any later version.
|
||||
#
|
||||
# This program is distributed in the hope that it will be useful,
|
||||
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||
# GNU General Public License for more details.
|
||||
#
|
||||
# You should have received a copy of the GNU General Public License
|
||||
# along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||
|
||||
# As a special exception to the GNU General Public License, if you
|
||||
# distribute this file as part of a program that contains a
|
||||
# configuration script generated by Autoconf, you may include it under
|
||||
# the same distribution terms that you use for the rest of that program.
|
||||
|
||||
# This file is maintained in Automake, please report
|
||||
# bugs to <bug-automake@gnu.org> or send patches to
|
||||
# <automake-patches@gnu.org>.
|
||||
|
||||
nl='
|
||||
'
|
||||
|
||||
# We need space, tab and new line, in precisely that order. Quoting is
|
||||
# there to prevent tools from complaining about whitespace usage.
|
||||
IFS=" "" $nl"
|
||||
|
||||
file_conv=
|
||||
|
||||
# func_file_conv build_file lazy
|
||||
# Convert a $build file to $host form and store it in $file
|
||||
# Currently only supports Windows hosts. If the determined conversion
|
||||
# type is listed in (the comma separated) LAZY, no conversion will
|
||||
# take place.
|
||||
func_file_conv ()
|
||||
{
|
||||
file=$1
|
||||
case $file in
|
||||
/ | /[!/]*) # absolute file, and not a UNC file
|
||||
if test -z "$file_conv"; then
|
||||
# lazily determine how to convert abs files
|
||||
case `uname -s` in
|
||||
MINGW*)
|
||||
file_conv=mingw
|
||||
;;
|
||||
CYGWIN*)
|
||||
file_conv=cygwin
|
||||
;;
|
||||
*)
|
||||
file_conv=wine
|
||||
;;
|
||||
esac
|
||||
fi
|
||||
case $file_conv/,$2, in
|
||||
*,$file_conv,*)
|
||||
;;
|
||||
mingw/*)
|
||||
file=`cmd //C echo "$file " | sed -e 's/"\(.*\) " *$/\1/'`
|
||||
;;
|
||||
cygwin/*)
|
||||
file=`cygpath -m "$file" || echo "$file"`
|
||||
;;
|
||||
wine/*)
|
||||
file=`winepath -w "$file" || echo "$file"`
|
||||
;;
|
||||
esac
|
||||
;;
|
||||
esac
|
||||
}
|
||||
|
||||
# func_cl_dashL linkdir
|
||||
# Make cl look for libraries in LINKDIR
|
||||
func_cl_dashL ()
|
||||
{
|
||||
func_file_conv "$1"
|
||||
if test -z "$lib_path"; then
|
||||
lib_path=$file
|
||||
else
|
||||
lib_path="$lib_path;$file"
|
||||
fi
|
||||
linker_opts="$linker_opts -LIBPATH:$file"
|
||||
}
|
||||
|
||||
# func_cl_dashl library
|
||||
# Do a library search-path lookup for cl
|
||||
func_cl_dashl ()
|
||||
{
|
||||
lib=$1
|
||||
found=no
|
||||
save_IFS=$IFS
|
||||
IFS=';'
|
||||
for dir in $lib_path $LIB
|
||||
do
|
||||
IFS=$save_IFS
|
||||
if $shared && test -f "$dir/$lib.dll.lib"; then
|
||||
found=yes
|
||||
lib=$dir/$lib.dll.lib
|
||||
break
|
||||
fi
|
||||
if test -f "$dir/$lib.lib"; then
|
||||
found=yes
|
||||
lib=$dir/$lib.lib
|
||||
break
|
||||
fi
|
||||
if test -f "$dir/lib$lib.a"; then
|
||||
found=yes
|
||||
lib=$dir/lib$lib.a
|
||||
break
|
||||
fi
|
||||
done
|
||||
IFS=$save_IFS
|
||||
|
||||
if test "$found" != yes; then
|
||||
lib=$lib.lib
|
||||
fi
|
||||
}
|
||||
|
||||
# func_cl_wrapper cl arg...
|
||||
# Adjust compile command to suit cl
|
||||
func_cl_wrapper ()
|
||||
{
|
||||
# Assume a capable shell
|
||||
lib_path=
|
||||
shared=:
|
||||
linker_opts=
|
||||
for arg
|
||||
do
|
||||
if test -n "$eat"; then
|
||||
eat=
|
||||
else
|
||||
case $1 in
|
||||
-o)
|
||||
# configure might choose to run compile as 'compile cc -o foo foo.c'.
|
||||
eat=1
|
||||
case $2 in
|
||||
*.o | *.[oO][bB][jJ])
|
||||
func_file_conv "$2"
|
||||
set x "$@" -Fo"$file"
|
||||
shift
|
||||
;;
|
||||
*)
|
||||
func_file_conv "$2"
|
||||
set x "$@" -Fe"$file"
|
||||
shift
|
||||
;;
|
||||
esac
|
||||
;;
|
||||
-I)
|
||||
eat=1
|
||||
func_file_conv "$2" mingw
|
||||
set x "$@" -I"$file"
|
||||
shift
|
||||
;;
|
||||
-I*)
|
||||
func_file_conv "${1#-I}" mingw
|
||||
set x "$@" -I"$file"
|
||||
shift
|
||||
;;
|
||||
-l)
|
||||
eat=1
|
||||
func_cl_dashl "$2"
|
||||
set x "$@" "$lib"
|
||||
shift
|
||||
;;
|
||||
-l*)
|
||||
func_cl_dashl "${1#-l}"
|
||||
set x "$@" "$lib"
|
||||
shift
|
||||
;;
|
||||
-L)
|
||||
eat=1
|
||||
func_cl_dashL "$2"
|
||||
;;
|
||||
-L*)
|
||||
func_cl_dashL "${1#-L}"
|
||||
;;
|
||||
-static)
|
||||
shared=false
|
||||
;;
|
||||
-Wl,*)
|
||||
arg=${1#-Wl,}
|
||||
save_ifs="$IFS"; IFS=','
|
||||
for flag in $arg; do
|
||||
IFS="$save_ifs"
|
||||
linker_opts="$linker_opts $flag"
|
||||
done
|
||||
IFS="$save_ifs"
|
||||
;;
|
||||
-Xlinker)
|
||||
eat=1
|
||||
linker_opts="$linker_opts $2"
|
||||
;;
|
||||
-*)
|
||||
set x "$@" "$1"
|
||||
shift
|
||||
;;
|
||||
*.cc | *.CC | *.cxx | *.CXX | *.[cC]++)
|
||||
func_file_conv "$1"
|
||||
set x "$@" -Tp"$file"
|
||||
shift
|
||||
;;
|
||||
*.c | *.cpp | *.CPP | *.lib | *.LIB | *.Lib | *.OBJ | *.obj | *.[oO])
|
||||
func_file_conv "$1" mingw
|
||||
set x "$@" "$file"
|
||||
shift
|
||||
;;
|
||||
*)
|
||||
set x "$@" "$1"
|
||||
shift
|
||||
;;
|
||||
esac
|
||||
fi
|
||||
shift
|
||||
done
|
||||
if test -n "$linker_opts"; then
|
||||
linker_opts="-link$linker_opts"
|
||||
fi
|
||||
exec "$@" $linker_opts
|
||||
exit 1
|
||||
}
|
||||
|
||||
eat=
|
||||
|
||||
case $1 in
|
||||
'')
|
||||
echo "$0: No command. Try '$0 --help' for more information." 1>&2
|
||||
exit 1;
|
||||
;;
|
||||
-h | --h*)
|
||||
cat <<\EOF
|
||||
Usage: compile [--help] [--version] PROGRAM [ARGS]
|
||||
|
||||
Wrapper for compilers which do not understand '-c -o'.
|
||||
Remove '-o dest.o' from ARGS, run PROGRAM with the remaining
|
||||
arguments, and rename the output as expected.
|
||||
|
||||
If you are trying to build a whole package this is not the
|
||||
right script to run: please start by reading the file 'INSTALL'.
|
||||
|
||||
Report bugs to <bug-automake@gnu.org>.
|
||||
EOF
|
||||
exit $?
|
||||
;;
|
||||
-v | --v*)
|
||||
echo "compile $scriptversion"
|
||||
exit $?
|
||||
;;
|
||||
cl | *[/\\]cl | cl.exe | *[/\\]cl.exe )
|
||||
func_cl_wrapper "$@" # Doesn't return...
|
||||
;;
|
||||
esac
|
||||
|
||||
ofile=
|
||||
cfile=
|
||||
|
||||
for arg
|
||||
do
|
||||
if test -n "$eat"; then
|
||||
eat=
|
||||
else
|
||||
case $1 in
|
||||
-o)
|
||||
# configure might choose to run compile as 'compile cc -o foo foo.c'.
|
||||
# So we strip '-o arg' only if arg is an object.
|
||||
eat=1
|
||||
case $2 in
|
||||
*.o | *.obj)
|
||||
ofile=$2
|
||||
;;
|
||||
*)
|
||||
set x "$@" -o "$2"
|
||||
shift
|
||||
;;
|
||||
esac
|
||||
;;
|
||||
*.c)
|
||||
cfile=$1
|
||||
set x "$@" "$1"
|
||||
shift
|
||||
;;
|
||||
*)
|
||||
set x "$@" "$1"
|
||||
shift
|
||||
;;
|
||||
esac
|
||||
fi
|
||||
shift
|
||||
done
|
||||
|
||||
if test -z "$ofile" || test -z "$cfile"; then
|
||||
# If no '-o' option was seen then we might have been invoked from a
|
||||
# pattern rule where we don't need one. That is ok -- this is a
|
||||
# normal compilation that the losing compiler can handle. If no
|
||||
# '.c' file was seen then we are probably linking. That is also
|
||||
# ok.
|
||||
exec "$@"
|
||||
fi
|
||||
|
||||
# Name of file we expect compiler to create.
|
||||
cofile=`echo "$cfile" | sed 's|^.*[\\/]||; s|^[a-zA-Z]:||; s/\.c$/.o/'`
|
||||
|
||||
# Create the lock directory.
|
||||
# Note: use '[/\\:.-]' here to ensure that we don't use the same name
|
||||
# that we are using for the .o file. Also, base the name on the expected
|
||||
# object file name, since that is what matters with a parallel build.
|
||||
lockdir=`echo "$cofile" | sed -e 's|[/\\:.-]|_|g'`.d
|
||||
while true; do
|
||||
if mkdir "$lockdir" >/dev/null 2>&1; then
|
||||
break
|
||||
fi
|
||||
sleep 1
|
||||
done
|
||||
# FIXME: race condition here if user kills between mkdir and trap.
|
||||
trap "rmdir '$lockdir'; exit 1" 1 2 15
|
||||
|
||||
# Run the compile.
|
||||
"$@"
|
||||
ret=$?
|
||||
|
||||
if test -f "$cofile"; then
|
||||
test "$cofile" = "$ofile" || mv "$cofile" "$ofile"
|
||||
elif test -f "${cofile}bj"; then
|
||||
test "${cofile}bj" = "$ofile" || mv "${cofile}bj" "$ofile"
|
||||
fi
|
||||
|
||||
rmdir "$lockdir"
|
||||
exit $ret
|
||||
|
||||
# Local Variables:
|
||||
# mode: shell-script
|
||||
# sh-indentation: 2
|
||||
# eval: (add-hook 'write-file-hooks 'time-stamp)
|
||||
# time-stamp-start: "scriptversion="
|
||||
# time-stamp-format: "%:y-%02m-%02d.%02H"
|
||||
# time-stamp-time-zone: "UTC"
|
||||
# time-stamp-end: "; # UTC"
|
||||
# End:
|
67
configure.ac
|
@ -3,9 +3,12 @@
|
|||
# FIXME - add project url as the last argument
|
||||
AC_INIT(gf-complete, 1.0)
|
||||
|
||||
# Override default CFLAGS
|
||||
: ${CFLAGS="-Wall -Wpointer-arith -O3 -g"}
|
||||
|
||||
AC_PREREQ([2.61])
|
||||
|
||||
AM_INIT_AUTOMAKE([no-dependencies], [foreign])
|
||||
AM_INIT_AUTOMAKE([no-dependencies foreign parallel-tests])
|
||||
LT_INIT # libtool
|
||||
|
||||
AC_CONFIG_HEADER(include/config.h)
|
||||
|
@ -16,13 +19,69 @@ AC_CONFIG_MACRO_DIR([m4])
|
|||
# This prevents './configure; make' from trying to run autotools.
|
||||
AM_MAINTAINER_MODE([disable])
|
||||
|
||||
# Override default CFLAGS
|
||||
CFLAGS="-Wall -Wpointer-arith -O3 -g"
|
||||
|
||||
dnl Compiling with per-target flags requires AM_PROG_CC_C_O.
|
||||
AC_PROG_CC
|
||||
|
||||
# Check for functions to provide aligned memory
|
||||
#
|
||||
AC_CHECK_FUNCS([posix_memalign],
|
||||
[found_memalign=yes; break])
|
||||
|
||||
AS_IF([test "x$found_memalign" != "xyes"], [AC_MSG_WARN([No function for aligned memory allocation found])])
|
||||
|
||||
AC_ARG_ENABLE([debug-functions],
|
||||
AS_HELP_STRING([--enable-debug-func], [Enable debugging of functions selected]))
|
||||
AS_IF([test "x$enable_debug_func" = "xyes"], [CPPFLAGS="$CPPFLAGS -DDEBUG_FUNCTIONS"])
|
||||
|
||||
AC_ARG_ENABLE([debug-cpu],
|
||||
AS_HELP_STRING([--enable-debug-cpu], [Enable debugging of SIMD detection]))
|
||||
AS_IF([test "x$enable_debug_cpu" = "xyes"], [CPPFLAGS="$CPPFLAGS -DDEBUG_CPU_DETECTION"])
|
||||
|
||||
AX_EXT()
|
||||
|
||||
AC_ARG_ENABLE([neon],
|
||||
AS_HELP_STRING([--disable-neon], [Build without NEON optimizations]))
|
||||
|
||||
AS_IF([test "x$enable_neon" != "xno"],
|
||||
[noneon_CPPFLAGS=$CPPFLAGS
|
||||
CPPFLAGS="$CPPFLAGS $SIMD_FLAGS"
|
||||
AC_CHECK_HEADER([arm_neon.h],
|
||||
[have_neon=yes],
|
||||
[have_neon=no
|
||||
CPPFLAGS=$noneon_CPPFLAGS])],
|
||||
[have_neon=no
|
||||
AS_IF([test "x$ax_cv_have_neon_ext" = "xyes"],
|
||||
[SIMD_FLAGS=""])
|
||||
])
|
||||
|
||||
AS_IF([test "x$have_neon" = "xno"],
|
||||
[AS_IF([test "x$enable_neon" = "xyes"],
|
||||
[AC_MSG_ERROR([neon requested but arm_neon.h not found])])
|
||||
])
|
||||
AM_CONDITIONAL([HAVE_NEON], [test "x$have_neon" = "xyes"])
|
||||
|
||||
AC_ARG_ENABLE([sse],
|
||||
AS_HELP_STRING([--disable-sse], [Build without SSE optimizations]),
|
||||
[if test "x$enableval" = "xno" ; then
|
||||
SIMD_FLAGS=""
|
||||
echo "DISABLED SSE!!!"
|
||||
fi]
|
||||
)
|
||||
|
||||
AC_ARG_ENABLE([valgrind],
|
||||
[AS_HELP_STRING([--enable-valgrind], [run tests with valgrind])],
|
||||
[],
|
||||
[enable_valgrind=no])
|
||||
AM_CONDITIONAL(ENABLE_VALGRIND, test "x$enable_valgrind" != xno)
|
||||
|
||||
AC_ARG_ENABLE([avx], AS_HELP_STRING([--enable-avx], [Build with AVX optimizations]))
|
||||
AX_CHECK_COMPILE_FLAG(-mavx, [ax_cv_support_avx=yes], [])
|
||||
|
||||
AS_IF([test "x$enable_avx" = "xyes"],
|
||||
[AS_IF([test "x$ax_cv_support_avx" = "xno"],
|
||||
[AC_MSG_ERROR([AVX requested but compiler does not support -mavx])],
|
||||
[SIMD_FLAGS="$SIMD_FLAGS -mavx"])
|
||||
])
|
||||
|
||||
AC_CONFIG_FILES([Makefile src/Makefile tools/Makefile test/Makefile examples/Makefile])
|
||||
AC_OUTPUT
|
||||
|
|
791
depcomp
|
@ -1,791 +0,0 @@
|
|||
#! /bin/sh
|
||||
# depcomp - compile a program generating dependencies as side-effects
|
||||
|
||||
scriptversion=2013-05-30.07; # UTC
|
||||
|
||||
# Copyright (C) 1999-2013 Free Software Foundation, Inc.
|
||||
|
||||
# This program is free software; you can redistribute it and/or modify
|
||||
# it under the terms of the GNU General Public License as published by
|
||||
# the Free Software Foundation; either version 2, or (at your option)
|
||||
# any later version.
|
||||
|
||||
# This program is distributed in the hope that it will be useful,
|
||||
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||
# GNU General Public License for more details.
|
||||
|
||||
# You should have received a copy of the GNU General Public License
|
||||
# along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||
|
||||
# As a special exception to the GNU General Public License, if you
|
||||
# distribute this file as part of a program that contains a
|
||||
# configuration script generated by Autoconf, you may include it under
|
||||
# the same distribution terms that you use for the rest of that program.
|
||||
|
||||
# Originally written by Alexandre Oliva <oliva@dcc.unicamp.br>.
|
||||
|
||||
case $1 in
|
||||
'')
|
||||
echo "$0: No command. Try '$0 --help' for more information." 1>&2
|
||||
exit 1;
|
||||
;;
|
||||
-h | --h*)
|
||||
cat <<\EOF
|
||||
Usage: depcomp [--help] [--version] PROGRAM [ARGS]
|
||||
|
||||
Run PROGRAMS ARGS to compile a file, generating dependencies
|
||||
as side-effects.
|
||||
|
||||
Environment variables:
|
||||
depmode Dependency tracking mode.
|
||||
source Source file read by 'PROGRAMS ARGS'.
|
||||
object Object file output by 'PROGRAMS ARGS'.
|
||||
DEPDIR directory where to store dependencies.
|
||||
depfile Dependency file to output.
|
||||
tmpdepfile Temporary file to use when outputting dependencies.
|
||||
libtool Whether libtool is used (yes/no).
|
||||
|
||||
Report bugs to <bug-automake@gnu.org>.
|
||||
EOF
|
||||
exit $?
|
||||
;;
|
||||
-v | --v*)
|
||||
echo "depcomp $scriptversion"
|
||||
exit $?
|
||||
;;
|
||||
esac
|
||||
|
||||
# Get the directory component of the given path, and save it in the
|
||||
# global variables '$dir'. Note that this directory component will
|
||||
# be either empty or ending with a '/' character. This is deliberate.
|
||||
set_dir_from ()
|
||||
{
|
||||
case $1 in
|
||||
*/*) dir=`echo "$1" | sed -e 's|/[^/]*$|/|'`;;
|
||||
*) dir=;;
|
||||
esac
|
||||
}
|
||||
|
||||
# Get the suffix-stripped basename of the given path, and save it the
|
||||
# global variable '$base'.
|
||||
set_base_from ()
|
||||
{
|
||||
base=`echo "$1" | sed -e 's|^.*/||' -e 's/\.[^.]*$//'`
|
||||
}
|
||||
|
||||
# If no dependency file was actually created by the compiler invocation,
|
||||
# we still have to create a dummy depfile, to avoid errors with the
|
||||
# Makefile "include basename.Plo" scheme.
|
||||
make_dummy_depfile ()
|
||||
{
|
||||
echo "#dummy" > "$depfile"
|
||||
}
|
||||
|
||||
# Factor out some common post-processing of the generated depfile.
|
||||
# Requires the auxiliary global variable '$tmpdepfile' to be set.
|
||||
aix_post_process_depfile ()
|
||||
{
|
||||
# If the compiler actually managed to produce a dependency file,
|
||||
# post-process it.
|
||||
if test -f "$tmpdepfile"; then
|
||||
# Each line is of the form 'foo.o: dependency.h'.
|
||||
# Do two passes, one to just change these to
|
||||
# $object: dependency.h
|
||||
# and one to simply output
|
||||
# dependency.h:
|
||||
# which is needed to avoid the deleted-header problem.
|
||||
{ sed -e "s,^.*\.[$lower]*:,$object:," < "$tmpdepfile"
|
||||
sed -e "s,^.*\.[$lower]*:[$tab ]*,," -e 's,$,:,' < "$tmpdepfile"
|
||||
} > "$depfile"
|
||||
rm -f "$tmpdepfile"
|
||||
else
|
||||
make_dummy_depfile
|
||||
fi
|
||||
}
|
||||
|
||||
# A tabulation character.
|
||||
tab=' '
|
||||
# A newline character.
|
||||
nl='
|
||||
'
|
||||
# Character ranges might be problematic outside the C locale.
|
||||
# These definitions help.
|
||||
upper=ABCDEFGHIJKLMNOPQRSTUVWXYZ
|
||||
lower=abcdefghijklmnopqrstuvwxyz
|
||||
digits=0123456789
|
||||
alpha=${upper}${lower}
|
||||
|
||||
if test -z "$depmode" || test -z "$source" || test -z "$object"; then
|
||||
echo "depcomp: Variables source, object and depmode must be set" 1>&2
|
||||
exit 1
|
||||
fi
|
||||
|
||||
# Dependencies for sub/bar.o or sub/bar.obj go into sub/.deps/bar.Po.
|
||||
depfile=${depfile-`echo "$object" |
|
||||
sed 's|[^\\/]*$|'${DEPDIR-.deps}'/&|;s|\.\([^.]*\)$|.P\1|;s|Pobj$|Po|'`}
|
||||
tmpdepfile=${tmpdepfile-`echo "$depfile" | sed 's/\.\([^.]*\)$/.T\1/'`}
|
||||
|
||||
rm -f "$tmpdepfile"
|
||||
|
||||
# Avoid interferences from the environment.
|
||||
gccflag= dashmflag=
|
||||
|
||||
# Some modes work just like other modes, but use different flags. We
|
||||
# parameterize here, but still list the modes in the big case below,
|
||||
# to make depend.m4 easier to write. Note that we *cannot* use a case
|
||||
# here, because this file can only contain one case statement.
|
||||
if test "$depmode" = hp; then
|
||||
# HP compiler uses -M and no extra arg.
|
||||
gccflag=-M
|
||||
depmode=gcc
|
||||
fi
|
||||
|
||||
if test "$depmode" = dashXmstdout; then
|
||||
# This is just like dashmstdout with a different argument.
|
||||
dashmflag=-xM
|
||||
depmode=dashmstdout
|
||||
fi
|
||||
|
||||
cygpath_u="cygpath -u -f -"
|
||||
if test "$depmode" = msvcmsys; then
|
||||
# This is just like msvisualcpp but w/o cygpath translation.
|
||||
# Just convert the backslash-escaped backslashes to single forward
|
||||
# slashes to satisfy depend.m4
|
||||
cygpath_u='sed s,\\\\,/,g'
|
||||
depmode=msvisualcpp
|
||||
fi
|
||||
|
||||
if test "$depmode" = msvc7msys; then
|
||||
# This is just like msvc7 but w/o cygpath translation.
|
||||
# Just convert the backslash-escaped backslashes to single forward
|
||||
# slashes to satisfy depend.m4
|
||||
cygpath_u='sed s,\\\\,/,g'
|
||||
depmode=msvc7
|
||||
fi
|
||||
|
||||
if test "$depmode" = xlc; then
|
||||
# IBM C/C++ Compilers xlc/xlC can output gcc-like dependency information.
|
||||
gccflag=-qmakedep=gcc,-MF
|
||||
depmode=gcc
|
||||
fi
|
||||
|
||||
case "$depmode" in
|
||||
gcc3)
|
||||
## gcc 3 implements dependency tracking that does exactly what
|
||||
## we want. Yay! Note: for some reason libtool 1.4 doesn't like
|
||||
## it if -MD -MP comes after the -MF stuff. Hmm.
|
||||
## Unfortunately, FreeBSD c89 acceptance of flags depends upon
|
||||
## the command line argument order; so add the flags where they
|
||||
## appear in depend2.am. Note that the slowdown incurred here
|
||||
## affects only configure: in makefiles, %FASTDEP% shortcuts this.
|
||||
for arg
|
||||
do
|
||||
case $arg in
|
||||
-c) set fnord "$@" -MT "$object" -MD -MP -MF "$tmpdepfile" "$arg" ;;
|
||||
*) set fnord "$@" "$arg" ;;
|
||||
esac
|
||||
shift # fnord
|
||||
shift # $arg
|
||||
done
|
||||
"$@"
|
||||
stat=$?
|
||||
if test $stat -ne 0; then
|
||||
rm -f "$tmpdepfile"
|
||||
exit $stat
|
||||
fi
|
||||
mv "$tmpdepfile" "$depfile"
|
||||
;;
|
||||
|
||||
gcc)
|
||||
## Note that this doesn't just cater to obsosete pre-3.x GCC compilers.
|
||||
## but also to in-use compilers like IMB xlc/xlC and the HP C compiler.
|
||||
## (see the conditional assignment to $gccflag above).
|
||||
## There are various ways to get dependency output from gcc. Here's
|
||||
## why we pick this rather obscure method:
|
||||
## - Don't want to use -MD because we'd like the dependencies to end
|
||||
## up in a subdir. Having to rename by hand is ugly.
|
||||
## (We might end up doing this anyway to support other compilers.)
|
||||
## - The DEPENDENCIES_OUTPUT environment variable makes gcc act like
|
||||
## -MM, not -M (despite what the docs say). Also, it might not be
|
||||
## supported by the other compilers which use the 'gcc' depmode.
|
||||
## - Using -M directly means running the compiler twice (even worse
|
||||
## than renaming).
|
||||
if test -z "$gccflag"; then
|
||||
gccflag=-MD,
|
||||
fi
|
||||
"$@" -Wp,"$gccflag$tmpdepfile"
|
||||
stat=$?
|
||||
if test $stat -ne 0; then
|
||||
rm -f "$tmpdepfile"
|
||||
exit $stat
|
||||
fi
|
||||
rm -f "$depfile"
|
||||
echo "$object : \\" > "$depfile"
|
||||
# The second -e expression handles DOS-style file names with drive
|
||||
# letters.
|
||||
sed -e 's/^[^:]*: / /' \
|
||||
-e 's/^['$alpha']:\/[^:]*: / /' < "$tmpdepfile" >> "$depfile"
|
||||
## This next piece of magic avoids the "deleted header file" problem.
|
||||
## The problem is that when a header file which appears in a .P file
|
||||
## is deleted, the dependency causes make to die (because there is
|
||||
## typically no way to rebuild the header). We avoid this by adding
|
||||
## dummy dependencies for each header file. Too bad gcc doesn't do
|
||||
## this for us directly.
|
||||
## Some versions of gcc put a space before the ':'. On the theory
|
||||
## that the space means something, we add a space to the output as
|
||||
## well. hp depmode also adds that space, but also prefixes the VPATH
|
||||
## to the object. Take care to not repeat it in the output.
|
||||
## Some versions of the HPUX 10.20 sed can't process this invocation
|
||||
## correctly. Breaking it into two sed invocations is a workaround.
|
||||
tr ' ' "$nl" < "$tmpdepfile" \
|
||||
| sed -e 's/^\\$//' -e '/^$/d' -e "s|.*$object$||" -e '/:$/d' \
|
||||
| sed -e 's/$/ :/' >> "$depfile"
|
||||
rm -f "$tmpdepfile"
|
||||
;;
|
||||
|
||||
hp)
|
||||
# This case exists only to let depend.m4 do its work. It works by
|
||||
# looking at the text of this script. This case will never be run,
|
||||
# since it is checked for above.
|
||||
exit 1
|
||||
;;
|
||||
|
||||
sgi)
|
||||
if test "$libtool" = yes; then
|
||||
"$@" "-Wp,-MDupdate,$tmpdepfile"
|
||||
else
|
||||
"$@" -MDupdate "$tmpdepfile"
|
||||
fi
|
||||
stat=$?
|
||||
if test $stat -ne 0; then
|
||||
rm -f "$tmpdepfile"
|
||||
exit $stat
|
||||
fi
|
||||
rm -f "$depfile"
|
||||
|
||||
if test -f "$tmpdepfile"; then # yes, the sourcefile depend on other files
|
||||
echo "$object : \\" > "$depfile"
|
||||
# Clip off the initial element (the dependent). Don't try to be
|
||||
# clever and replace this with sed code, as IRIX sed won't handle
|
||||
# lines with more than a fixed number of characters (4096 in
|
||||
# IRIX 6.2 sed, 8192 in IRIX 6.5). We also remove comment lines;
|
||||
# the IRIX cc adds comments like '#:fec' to the end of the
|
||||
# dependency line.
|
||||
tr ' ' "$nl" < "$tmpdepfile" \
|
||||
| sed -e 's/^.*\.o://' -e 's/#.*$//' -e '/^$/ d' \
|
||||
| tr "$nl" ' ' >> "$depfile"
|
||||
echo >> "$depfile"
|
||||
# The second pass generates a dummy entry for each header file.
|
||||
tr ' ' "$nl" < "$tmpdepfile" \
|
||||
| sed -e 's/^.*\.o://' -e 's/#.*$//' -e '/^$/ d' -e 's/$/:/' \
|
||||
>> "$depfile"
|
||||
else
|
||||
make_dummy_depfile
|
||||
fi
|
||||
rm -f "$tmpdepfile"
|
||||
;;
|
||||
|
||||
xlc)
|
||||
# This case exists only to let depend.m4 do its work. It works by
|
||||
# looking at the text of this script. This case will never be run,
|
||||
# since it is checked for above.
|
||||
exit 1
|
||||
;;
|
||||
|
||||
aix)
|
||||
# The C for AIX Compiler uses -M and outputs the dependencies
|
||||
# in a .u file. In older versions, this file always lives in the
|
||||
# current directory. Also, the AIX compiler puts '$object:' at the
|
||||
# start of each line; $object doesn't have directory information.
|
||||
# Version 6 uses the directory in both cases.
|
||||
set_dir_from "$object"
|
||||
set_base_from "$object"
|
||||
if test "$libtool" = yes; then
|
||||
tmpdepfile1=$dir$base.u
|
||||
tmpdepfile2=$base.u
|
||||
tmpdepfile3=$dir.libs/$base.u
|
||||
"$@" -Wc,-M
|
||||
else
|
||||
tmpdepfile1=$dir$base.u
|
||||
tmpdepfile2=$dir$base.u
|
||||
tmpdepfile3=$dir$base.u
|
||||
"$@" -M
|
||||
fi
|
||||
stat=$?
|
||||
if test $stat -ne 0; then
|
||||
rm -f "$tmpdepfile1" "$tmpdepfile2" "$tmpdepfile3"
|
||||
exit $stat
|
||||
fi
|
||||
|
||||
for tmpdepfile in "$tmpdepfile1" "$tmpdepfile2" "$tmpdepfile3"
|
||||
do
|
||||
test -f "$tmpdepfile" && break
|
||||
done
|
||||
aix_post_process_depfile
|
||||
;;
|
||||
|
||||
tcc)
|
||||
# tcc (Tiny C Compiler) understand '-MD -MF file' since version 0.9.26
|
||||
# FIXME: That version still under development at the moment of writing.
|
||||
# Make that this statement remains true also for stable, released
|
||||
# versions.
|
||||
# It will wrap lines (doesn't matter whether long or short) with a
|
||||
# trailing '\', as in:
|
||||
#
|
||||
# foo.o : \
|
||||
# foo.c \
|
||||
# foo.h \
|
||||
#
|
||||
# It will put a trailing '\' even on the last line, and will use leading
|
||||
# spaces rather than leading tabs (at least since its commit 0394caf7
|
||||
# "Emit spaces for -MD").
|
||||
"$@" -MD -MF "$tmpdepfile"
|
||||
stat=$?
|
||||
if test $stat -ne 0; then
|
||||
rm -f "$tmpdepfile"
|
||||
exit $stat
|
||||
fi
|
||||
rm -f "$depfile"
|
||||
# Each non-empty line is of the form 'foo.o : \' or ' dep.h \'.
|
||||
# We have to change lines of the first kind to '$object: \'.
|
||||
sed -e "s|.*:|$object :|" < "$tmpdepfile" > "$depfile"
|
||||
# And for each line of the second kind, we have to emit a 'dep.h:'
|
||||
# dummy dependency, to avoid the deleted-header problem.
|
||||
sed -n -e 's|^ *\(.*\) *\\$|\1:|p' < "$tmpdepfile" >> "$depfile"
|
||||
rm -f "$tmpdepfile"
|
||||
;;
|
||||
|
||||
## The order of this option in the case statement is important, since the
|
||||
## shell code in configure will try each of these formats in the order
|
||||
## listed in this file. A plain '-MD' option would be understood by many
|
||||
## compilers, so we must ensure this comes after the gcc and icc options.
|
||||
pgcc)
|
||||
# Portland's C compiler understands '-MD'.
|
||||
# Will always output deps to 'file.d' where file is the root name of the
|
||||
# source file under compilation, even if file resides in a subdirectory.
|
||||
# The object file name does not affect the name of the '.d' file.
|
||||
# pgcc 10.2 will output
|
||||
# foo.o: sub/foo.c sub/foo.h
|
||||
# and will wrap long lines using '\' :
|
||||
# foo.o: sub/foo.c ... \
|
||||
# sub/foo.h ... \
|
||||
# ...
|
||||
set_dir_from "$object"
|
||||
# Use the source, not the object, to determine the base name, since
|
||||
# that's sadly what pgcc will do too.
|
||||
set_base_from "$source"
|
||||
tmpdepfile=$base.d
|
||||
|
||||
# For projects that build the same source file twice into different object
|
||||
# files, the pgcc approach of using the *source* file root name can cause
|
||||
# problems in parallel builds. Use a locking strategy to avoid stomping on
|
||||
# the same $tmpdepfile.
|
||||
lockdir=$base.d-lock
|
||||
trap "
|
||||
echo '$0: caught signal, cleaning up...' >&2
|
||||
rmdir '$lockdir'
|
||||
exit 1
|
||||
" 1 2 13 15
|
||||
numtries=100
|
||||
i=$numtries
|
||||
while test $i -gt 0; do
|
||||
# mkdir is a portable test-and-set.
|
||||
if mkdir "$lockdir" 2>/dev/null; then
|
||||
# This process acquired the lock.
|
||||
"$@" -MD
|
||||
stat=$?
|
||||
# Release the lock.
|
||||
rmdir "$lockdir"
|
||||
break
|
||||
else
|
||||
# If the lock is being held by a different process, wait
|
||||
# until the winning process is done or we timeout.
|
||||
while test -d "$lockdir" && test $i -gt 0; do
|
||||
sleep 1
|
||||
i=`expr $i - 1`
|
||||
done
|
||||
fi
|
||||
i=`expr $i - 1`
|
||||
done
|
||||
trap - 1 2 13 15
|
||||
if test $i -le 0; then
|
||||
echo "$0: failed to acquire lock after $numtries attempts" >&2
|
||||
echo "$0: check lockdir '$lockdir'" >&2
|
||||
exit 1
|
||||
fi
|
||||
|
||||
if test $stat -ne 0; then
|
||||
rm -f "$tmpdepfile"
|
||||
exit $stat
|
||||
fi
|
||||
rm -f "$depfile"
|
||||
# Each line is of the form `foo.o: dependent.h',
|
||||
# or `foo.o: dep1.h dep2.h \', or ` dep3.h dep4.h \'.
|
||||
# Do two passes, one to just change these to
|
||||
# `$object: dependent.h' and one to simply `dependent.h:'.
|
||||
sed "s,^[^:]*:,$object :," < "$tmpdepfile" > "$depfile"
|
||||
# Some versions of the HPUX 10.20 sed can't process this invocation
|
||||
# correctly. Breaking it into two sed invocations is a workaround.
|
||||
sed 's,^[^:]*: \(.*\)$,\1,;s/^\\$//;/^$/d;/:$/d' < "$tmpdepfile" \
|
||||
| sed -e 's/$/ :/' >> "$depfile"
|
||||
rm -f "$tmpdepfile"
|
||||
;;
|
||||
|
||||
hp2)
|
||||
# The "hp" stanza above does not work with aCC (C++) and HP's ia64
|
||||
# compilers, which have integrated preprocessors. The correct option
|
||||
# to use with these is +Maked; it writes dependencies to a file named
|
||||
# 'foo.d', which lands next to the object file, wherever that
|
||||
# happens to be.
|
||||
# Much of this is similar to the tru64 case; see comments there.
|
||||
set_dir_from "$object"
|
||||
set_base_from "$object"
|
||||
if test "$libtool" = yes; then
|
||||
tmpdepfile1=$dir$base.d
|
||||
tmpdepfile2=$dir.libs/$base.d
|
||||
"$@" -Wc,+Maked
|
||||
else
|
||||
tmpdepfile1=$dir$base.d
|
||||
tmpdepfile2=$dir$base.d
|
||||
"$@" +Maked
|
||||
fi
|
||||
stat=$?
|
||||
if test $stat -ne 0; then
|
||||
rm -f "$tmpdepfile1" "$tmpdepfile2"
|
||||
exit $stat
|
||||
fi
|
||||
|
||||
for tmpdepfile in "$tmpdepfile1" "$tmpdepfile2"
|
||||
do
|
||||
test -f "$tmpdepfile" && break
|
||||
done
|
||||
if test -f "$tmpdepfile"; then
|
||||
sed -e "s,^.*\.[$lower]*:,$object:," "$tmpdepfile" > "$depfile"
|
||||
# Add 'dependent.h:' lines.
|
||||
sed -ne '2,${
|
||||
s/^ *//
|
||||
s/ \\*$//
|
||||
s/$/:/
|
||||
p
|
||||
}' "$tmpdepfile" >> "$depfile"
|
||||
else
|
||||
make_dummy_depfile
|
||||
fi
|
||||
rm -f "$tmpdepfile" "$tmpdepfile2"
|
||||
;;
|
||||
|
||||
tru64)
|
||||
# The Tru64 compiler uses -MD to generate dependencies as a side
|
||||
# effect. 'cc -MD -o foo.o ...' puts the dependencies into 'foo.o.d'.
|
||||
# At least on Alpha/Redhat 6.1, Compaq CCC V6.2-504 seems to put
|
||||
# dependencies in 'foo.d' instead, so we check for that too.
|
||||
# Subdirectories are respected.
|
||||
set_dir_from "$object"
|
||||
set_base_from "$object"
|
||||
|
||||
if test "$libtool" = yes; then
|
||||
# Libtool generates 2 separate objects for the 2 libraries. These
|
||||
# two compilations output dependencies in $dir.libs/$base.o.d and
|
||||
# in $dir$base.o.d. We have to check for both files, because
|
||||
# one of the two compilations can be disabled. We should prefer
|
||||
# $dir$base.o.d over $dir.libs/$base.o.d because the latter is
|
||||
# automatically cleaned when .libs/ is deleted, while ignoring
|
||||
# the former would cause a distcleancheck panic.
|
||||
tmpdepfile1=$dir$base.o.d # libtool 1.5
|
||||
tmpdepfile2=$dir.libs/$base.o.d # Likewise.
|
||||
tmpdepfile3=$dir.libs/$base.d # Compaq CCC V6.2-504
|
||||
"$@" -Wc,-MD
|
||||
else
|
||||
tmpdepfile1=$dir$base.d
|
||||
tmpdepfile2=$dir$base.d
|
||||
tmpdepfile3=$dir$base.d
|
||||
"$@" -MD
|
||||
fi
|
||||
|
||||
stat=$?
|
||||
if test $stat -ne 0; then
|
||||
rm -f "$tmpdepfile1" "$tmpdepfile2" "$tmpdepfile3"
|
||||
exit $stat
|
||||
fi
|
||||
|
||||
for tmpdepfile in "$tmpdepfile1" "$tmpdepfile2" "$tmpdepfile3"
|
||||
do
|
||||
test -f "$tmpdepfile" && break
|
||||
done
|
||||
# Same post-processing that is required for AIX mode.
|
||||
aix_post_process_depfile
|
||||
;;
|
||||
|
||||
msvc7)
|
||||
if test "$libtool" = yes; then
|
||||
showIncludes=-Wc,-showIncludes
|
||||
else
|
||||
showIncludes=-showIncludes
|
||||
fi
|
||||
"$@" $showIncludes > "$tmpdepfile"
|
||||
stat=$?
|
||||
grep -v '^Note: including file: ' "$tmpdepfile"
|
||||
if test $stat -ne 0; then
|
||||
rm -f "$tmpdepfile"
|
||||
exit $stat
|
||||
fi
|
||||
rm -f "$depfile"
|
||||
echo "$object : \\" > "$depfile"
|
||||
# The first sed program below extracts the file names and escapes
|
||||
# backslashes for cygpath. The second sed program outputs the file
|
||||
# name when reading, but also accumulates all include files in the
|
||||
# hold buffer in order to output them again at the end. This only
|
||||
# works with sed implementations that can handle large buffers.
|
||||
sed < "$tmpdepfile" -n '
|
||||
/^Note: including file: *\(.*\)/ {
|
||||
s//\1/
|
||||
s/\\/\\\\/g
|
||||
p
|
||||
}' | $cygpath_u | sort -u | sed -n '
|
||||
s/ /\\ /g
|
||||
s/\(.*\)/'"$tab"'\1 \\/p
|
||||
s/.\(.*\) \\/\1:/
|
||||
H
|
||||
$ {
|
||||
s/.*/'"$tab"'/
|
||||
G
|
||||
p
|
||||
}' >> "$depfile"
|
||||
echo >> "$depfile" # make sure the fragment doesn't end with a backslash
|
||||
rm -f "$tmpdepfile"
|
||||
;;
|
||||
|
||||
msvc7msys)
|
||||
# This case exists only to let depend.m4 do its work. It works by
|
||||
# looking at the text of this script. This case will never be run,
|
||||
# since it is checked for above.
|
||||
exit 1
|
||||
;;
|
||||
|
||||
#nosideeffect)
|
||||
# This comment above is used by automake to tell side-effect
|
||||
# dependency tracking mechanisms from slower ones.
|
||||
|
||||
dashmstdout)
|
||||
# Important note: in order to support this mode, a compiler *must*
|
||||
# always write the preprocessed file to stdout, regardless of -o.
|
||||
"$@" || exit $?
|
||||
|
||||
# Remove the call to Libtool.
|
||||
if test "$libtool" = yes; then
|
||||
while test "X$1" != 'X--mode=compile'; do
|
||||
shift
|
||||
done
|
||||
shift
|
||||
fi
|
||||
|
||||
# Remove '-o $object'.
|
||||
IFS=" "
|
||||
for arg
|
||||
do
|
||||
case $arg in
|
||||
-o)
|
||||
shift
|
||||
;;
|
||||
$object)
|
||||
shift
|
||||
;;
|
||||
*)
|
||||
set fnord "$@" "$arg"
|
||||
shift # fnord
|
||||
shift # $arg
|
||||
;;
|
||||
esac
|
||||
done
|
||||
|
||||
test -z "$dashmflag" && dashmflag=-M
|
||||
# Require at least two characters before searching for ':'
|
||||
# in the target name. This is to cope with DOS-style filenames:
|
||||
# a dependency such as 'c:/foo/bar' could be seen as target 'c' otherwise.
|
||||
"$@" $dashmflag |
|
||||
sed "s|^[$tab ]*[^:$tab ][^:][^:]*:[$tab ]*|$object: |" > "$tmpdepfile"
|
||||
rm -f "$depfile"
|
||||
cat < "$tmpdepfile" > "$depfile"
|
||||
# Some versions of the HPUX 10.20 sed can't process this sed invocation
|
||||
# correctly. Breaking it into two sed invocations is a workaround.
|
||||
tr ' ' "$nl" < "$tmpdepfile" \
|
||||
| sed -e 's/^\\$//' -e '/^$/d' -e '/:$/d' \
|
||||
| sed -e 's/$/ :/' >> "$depfile"
|
||||
rm -f "$tmpdepfile"
|
||||
;;
|
||||
|
||||
dashXmstdout)
|
||||
# This case only exists to satisfy depend.m4. It is never actually
|
||||
# run, as this mode is specially recognized in the preamble.
|
||||
exit 1
|
||||
;;
|
||||
|
||||
makedepend)
|
||||
"$@" || exit $?
|
||||
# Remove any Libtool call
|
||||
if test "$libtool" = yes; then
|
||||
while test "X$1" != 'X--mode=compile'; do
|
||||
shift
|
||||
done
|
||||
shift
|
||||
fi
|
||||
# X makedepend
|
||||
shift
|
||||
cleared=no eat=no
|
||||
for arg
|
||||
do
|
||||
case $cleared in
|
||||
no)
|
||||
set ""; shift
|
||||
cleared=yes ;;
|
||||
esac
|
||||
if test $eat = yes; then
|
||||
eat=no
|
||||
continue
|
||||
fi
|
||||
case "$arg" in
|
||||
-D*|-I*)
|
||||
set fnord "$@" "$arg"; shift ;;
|
||||
# Strip any option that makedepend may not understand. Remove
|
||||
# the object too, otherwise makedepend will parse it as a source file.
|
||||
-arch)
|
||||
eat=yes ;;
|
||||
-*|$object)
|
||||
;;
|
||||
*)
|
||||
set fnord "$@" "$arg"; shift ;;
|
||||
esac
|
||||
done
|
||||
obj_suffix=`echo "$object" | sed 's/^.*\././'`
|
||||
touch "$tmpdepfile"
|
||||
${MAKEDEPEND-makedepend} -o"$obj_suffix" -f"$tmpdepfile" "$@"
|
||||
rm -f "$depfile"
|
||||
# makedepend may prepend the VPATH from the source file name to the object.
|
||||
# No need to regex-escape $object, excess matching of '.' is harmless.
|
||||
sed "s|^.*\($object *:\)|\1|" "$tmpdepfile" > "$depfile"
|
||||
# Some versions of the HPUX 10.20 sed can't process the last invocation
|
||||
# correctly. Breaking it into two sed invocations is a workaround.
|
||||
sed '1,2d' "$tmpdepfile" \
|
||||
| tr ' ' "$nl" \
|
||||
| sed -e 's/^\\$//' -e '/^$/d' -e '/:$/d' \
|
||||
| sed -e 's/$/ :/' >> "$depfile"
|
||||
rm -f "$tmpdepfile" "$tmpdepfile".bak
|
||||
;;
|
||||
|
||||
cpp)
|
||||
# Important note: in order to support this mode, a compiler *must*
|
||||
# always write the preprocessed file to stdout.
|
||||
"$@" || exit $?
|
||||
|
||||
# Remove the call to Libtool.
|
||||
if test "$libtool" = yes; then
|
||||
while test "X$1" != 'X--mode=compile'; do
|
||||
shift
|
||||
done
|
||||
shift
|
||||
fi
|
||||
|
||||
# Remove '-o $object'.
|
||||
IFS=" "
|
||||
for arg
|
||||
do
|
||||
case $arg in
|
||||
-o)
|
||||
shift
|
||||
;;
|
||||
$object)
|
||||
shift
|
||||
;;
|
||||
*)
|
||||
set fnord "$@" "$arg"
|
||||
shift # fnord
|
||||
shift # $arg
|
||||
;;
|
||||
esac
|
||||
done
|
||||
|
||||
"$@" -E \
|
||||
| sed -n -e '/^# [0-9][0-9]* "\([^"]*\)".*/ s:: \1 \\:p' \
|
||||
-e '/^#line [0-9][0-9]* "\([^"]*\)".*/ s:: \1 \\:p' \
|
||||
| sed '$ s: \\$::' > "$tmpdepfile"
|
||||
rm -f "$depfile"
|
||||
echo "$object : \\" > "$depfile"
|
||||
cat < "$tmpdepfile" >> "$depfile"
|
||||
sed < "$tmpdepfile" '/^$/d;s/^ //;s/ \\$//;s/$/ :/' >> "$depfile"
|
||||
rm -f "$tmpdepfile"
|
||||
;;
|
||||
|
||||
msvisualcpp)
|
||||
# Important note: in order to support this mode, a compiler *must*
|
||||
# always write the preprocessed file to stdout.
|
||||
"$@" || exit $?
|
||||
|
||||
# Remove the call to Libtool.
|
||||
if test "$libtool" = yes; then
|
||||
while test "X$1" != 'X--mode=compile'; do
|
||||
shift
|
||||
done
|
||||
shift
|
||||
fi
|
||||
|
||||
IFS=" "
|
||||
for arg
|
||||
do
|
||||
case "$arg" in
|
||||
-o)
|
||||
shift
|
||||
;;
|
||||
$object)
|
||||
shift
|
||||
;;
|
||||
"-Gm"|"/Gm"|"-Gi"|"/Gi"|"-ZI"|"/ZI")
|
||||
set fnord "$@"
|
||||
shift
|
||||
shift
|
||||
;;
|
||||
*)
|
||||
set fnord "$@" "$arg"
|
||||
shift
|
||||
shift
|
||||
;;
|
||||
esac
|
||||
done
|
||||
"$@" -E 2>/dev/null |
|
||||
sed -n '/^#line [0-9][0-9]* "\([^"]*\)"/ s::\1:p' | $cygpath_u | sort -u > "$tmpdepfile"
|
||||
rm -f "$depfile"
|
||||
echo "$object : \\" > "$depfile"
|
||||
sed < "$tmpdepfile" -n -e 's% %\\ %g' -e '/^\(.*\)$/ s::'"$tab"'\1 \\:p' >> "$depfile"
|
||||
echo "$tab" >> "$depfile"
|
||||
sed < "$tmpdepfile" -n -e 's% %\\ %g' -e '/^\(.*\)$/ s::\1\::p' >> "$depfile"
|
||||
rm -f "$tmpdepfile"
|
||||
;;
|
||||
|
||||
msvcmsys)
|
||||
# This case exists only to let depend.m4 do its work. It works by
|
||||
# looking at the text of this script. This case will never be run,
|
||||
# since it is checked for above.
|
||||
exit 1
|
||||
;;
|
||||
|
||||
none)
|
||||
exec "$@"
|
||||
;;
|
||||
|
||||
*)
|
||||
echo "Unknown depmode $depmode" 1>&2
|
||||
exit 1
|
||||
;;
|
||||
esac
|
||||
|
||||
exit 0
|
||||
|
||||
# Local Variables:
|
||||
# mode: shell-script
|
||||
# sh-indentation: 2
|
||||
# eval: (add-hook 'write-file-hooks 'time-stamp)
|
||||
# time-stamp-start: "scriptversion="
|
||||
# time-stamp-format: "%:y-%02m-%02d.%02H"
|
||||
# time-stamp-time-zone: "UTC"
|
||||
# time-stamp-end: "; # UTC"
|
||||
# End:
|
|
@ -1,7 +1,7 @@
|
|||
# GF-Complete 'examples' AM file
|
||||
|
||||
INCLUDES=-I./ -I../include
|
||||
AM_CFLAGS = -O3 $(SIMD_FLAGS) -fPIC $(INCLUDES)
|
||||
AM_CPPFLAGS = -I$(top_builddir)/include -I$(top_srcdir)/include
|
||||
AM_CFLAGS = -O3 $(SIMD_FLAGS) -fPIC
|
||||
|
||||
bin_PROGRAMS = gf_example_1 gf_example_2 gf_example_3 gf_example_4 \
|
||||
gf_example_5 gf_example_6 gf_example_7
|
||||
|
|
|
@ -1,698 +0,0 @@
|
|||
# Makefile.in generated by automake 1.14.1 from Makefile.am.
|
||||
# @configure_input@
|
||||
|
||||
# Copyright (C) 1994-2013 Free Software Foundation, Inc.
|
||||
|
||||
# This Makefile.in is free software; the Free Software Foundation
|
||||
# gives unlimited permission to copy and/or distribute it,
|
||||
# with or without modifications, as long as this notice is preserved.
|
||||
|
||||
# This program is distributed in the hope that it will be useful,
|
||||
# but WITHOUT ANY WARRANTY, to the extent permitted by law; without
|
||||
# even the implied warranty of MERCHANTABILITY or FITNESS FOR A
|
||||
# PARTICULAR PURPOSE.
|
||||
|
||||
@SET_MAKE@
|
||||
|
||||
# GF-Complete 'examples' AM file
|
||||
|
||||
VPATH = @srcdir@
|
||||
am__is_gnu_make = test -n '$(MAKEFILE_LIST)' && test -n '$(MAKELEVEL)'
|
||||
am__make_running_with_option = \
|
||||
case $${target_option-} in \
|
||||
?) ;; \
|
||||
*) echo "am__make_running_with_option: internal error: invalid" \
|
||||
"target option '$${target_option-}' specified" >&2; \
|
||||
exit 1;; \
|
||||
esac; \
|
||||
has_opt=no; \
|
||||
sane_makeflags=$$MAKEFLAGS; \
|
||||
if $(am__is_gnu_make); then \
|
||||
sane_makeflags=$$MFLAGS; \
|
||||
else \
|
||||
case $$MAKEFLAGS in \
|
||||
*\\[\ \ ]*) \
|
||||
bs=\\; \
|
||||
sane_makeflags=`printf '%s\n' "$$MAKEFLAGS" \
|
||||
| sed "s/$$bs$$bs[$$bs $$bs ]*//g"`;; \
|
||||
esac; \
|
||||
fi; \
|
||||
skip_next=no; \
|
||||
strip_trailopt () \
|
||||
{ \
|
||||
flg=`printf '%s\n' "$$flg" | sed "s/$$1.*$$//"`; \
|
||||
}; \
|
||||
for flg in $$sane_makeflags; do \
|
||||
test $$skip_next = yes && { skip_next=no; continue; }; \
|
||||
case $$flg in \
|
||||
*=*|--*) continue;; \
|
||||
-*I) strip_trailopt 'I'; skip_next=yes;; \
|
||||
-*I?*) strip_trailopt 'I';; \
|
||||
-*O) strip_trailopt 'O'; skip_next=yes;; \
|
||||
-*O?*) strip_trailopt 'O';; \
|
||||
-*l) strip_trailopt 'l'; skip_next=yes;; \
|
||||
-*l?*) strip_trailopt 'l';; \
|
||||
-[dEDm]) skip_next=yes;; \
|
||||
-[JT]) skip_next=yes;; \
|
||||
esac; \
|
||||
case $$flg in \
|
||||
*$$target_option*) has_opt=yes; break;; \
|
||||
esac; \
|
||||
done; \
|
||||
test $$has_opt = yes
|
||||
am__make_dryrun = (target_option=n; $(am__make_running_with_option))
|
||||
am__make_keepgoing = (target_option=k; $(am__make_running_with_option))
|
||||
pkgdatadir = $(datadir)/@PACKAGE@
|
||||
pkgincludedir = $(includedir)/@PACKAGE@
|
||||
pkglibdir = $(libdir)/@PACKAGE@
|
||||
pkglibexecdir = $(libexecdir)/@PACKAGE@
|
||||
am__cd = CDPATH="$${ZSH_VERSION+.}$(PATH_SEPARATOR)" && cd
|
||||
install_sh_DATA = $(install_sh) -c -m 644
|
||||
install_sh_PROGRAM = $(install_sh) -c
|
||||
install_sh_SCRIPT = $(install_sh) -c
|
||||
INSTALL_HEADER = $(INSTALL_DATA)
|
||||
transform = $(program_transform_name)
|
||||
NORMAL_INSTALL = :
|
||||
PRE_INSTALL = :
|
||||
POST_INSTALL = :
|
||||
NORMAL_UNINSTALL = :
|
||||
PRE_UNINSTALL = :
|
||||
POST_UNINSTALL = :
|
||||
build_triplet = @build@
|
||||
host_triplet = @host@
|
||||
bin_PROGRAMS = gf_example_1$(EXEEXT) gf_example_2$(EXEEXT) \
|
||||
gf_example_3$(EXEEXT) gf_example_4$(EXEEXT) \
|
||||
gf_example_5$(EXEEXT) gf_example_6$(EXEEXT) \
|
||||
gf_example_7$(EXEEXT)
|
||||
subdir = examples
|
||||
DIST_COMMON = $(srcdir)/Makefile.in $(srcdir)/Makefile.am \
|
||||
$(top_srcdir)/depcomp
|
||||
ACLOCAL_M4 = $(top_srcdir)/aclocal.m4
|
||||
am__aclocal_m4_deps = $(top_srcdir)/m4/ax_check_compile_flag.m4 \
|
||||
$(top_srcdir)/m4/ax_ext.m4 \
|
||||
$(top_srcdir)/m4/ax_gcc_x86_avx_xgetbv.m4 \
|
||||
$(top_srcdir)/m4/ax_gcc_x86_cpuid.m4 \
|
||||
$(top_srcdir)/m4/libtool.m4 $(top_srcdir)/m4/ltoptions.m4 \
|
||||
$(top_srcdir)/m4/ltsugar.m4 $(top_srcdir)/m4/ltversion.m4 \
|
||||
$(top_srcdir)/m4/lt~obsolete.m4 $(top_srcdir)/configure.ac
|
||||
am__configure_deps = $(am__aclocal_m4_deps) $(CONFIGURE_DEPENDENCIES) \
|
||||
$(ACLOCAL_M4)
|
||||
mkinstalldirs = $(install_sh) -d
|
||||
CONFIG_HEADER = $(top_builddir)/include/config.h
|
||||
CONFIG_CLEAN_FILES =
|
||||
CONFIG_CLEAN_VPATH_FILES =
|
||||
am__installdirs = "$(DESTDIR)$(bindir)"
|
||||
PROGRAMS = $(bin_PROGRAMS)
|
||||
am_gf_example_1_OBJECTS = gf_example_1.$(OBJEXT)
|
||||
gf_example_1_OBJECTS = $(am_gf_example_1_OBJECTS)
|
||||
gf_example_1_DEPENDENCIES = ../src/libgf_complete.la
|
||||
AM_V_lt = $(am__v_lt_@AM_V@)
|
||||
am__v_lt_ = $(am__v_lt_@AM_DEFAULT_V@)
|
||||
am__v_lt_0 = --silent
|
||||
am__v_lt_1 =
|
||||
am_gf_example_2_OBJECTS = gf_example_2.$(OBJEXT)
|
||||
gf_example_2_OBJECTS = $(am_gf_example_2_OBJECTS)
|
||||
gf_example_2_DEPENDENCIES = ../src/libgf_complete.la
|
||||
am_gf_example_3_OBJECTS = gf_example_3.$(OBJEXT)
|
||||
gf_example_3_OBJECTS = $(am_gf_example_3_OBJECTS)
|
||||
gf_example_3_DEPENDENCIES = ../src/libgf_complete.la
|
||||
am_gf_example_4_OBJECTS = gf_example_4.$(OBJEXT)
|
||||
gf_example_4_OBJECTS = $(am_gf_example_4_OBJECTS)
|
||||
gf_example_4_DEPENDENCIES = ../src/libgf_complete.la
|
||||
am_gf_example_5_OBJECTS = gf_example_5.$(OBJEXT)
|
||||
gf_example_5_OBJECTS = $(am_gf_example_5_OBJECTS)
|
||||
gf_example_5_DEPENDENCIES = ../src/libgf_complete.la
|
||||
am_gf_example_6_OBJECTS = gf_example_6.$(OBJEXT)
|
||||
gf_example_6_OBJECTS = $(am_gf_example_6_OBJECTS)
|
||||
gf_example_6_DEPENDENCIES = ../src/libgf_complete.la
|
||||
am_gf_example_7_OBJECTS = gf_example_7.$(OBJEXT)
|
||||
gf_example_7_OBJECTS = $(am_gf_example_7_OBJECTS)
|
||||
gf_example_7_DEPENDENCIES = ../src/libgf_complete.la
|
||||
AM_V_P = $(am__v_P_@AM_V@)
|
||||
am__v_P_ = $(am__v_P_@AM_DEFAULT_V@)
|
||||
am__v_P_0 = false
|
||||
am__v_P_1 = :
|
||||
AM_V_GEN = $(am__v_GEN_@AM_V@)
|
||||
am__v_GEN_ = $(am__v_GEN_@AM_DEFAULT_V@)
|
||||
am__v_GEN_0 = @echo " GEN " $@;
|
||||
am__v_GEN_1 =
|
||||
AM_V_at = $(am__v_at_@AM_V@)
|
||||
am__v_at_ = $(am__v_at_@AM_DEFAULT_V@)
|
||||
am__v_at_0 = @
|
||||
am__v_at_1 =
|
||||
DEFAULT_INCLUDES = -I.@am__isrc@ -I$(top_builddir)/include
|
||||
depcomp = $(SHELL) $(top_srcdir)/depcomp
|
||||
am__depfiles_maybe = depfiles
|
||||
am__mv = mv -f
|
||||
COMPILE = $(CC) $(DEFS) $(DEFAULT_INCLUDES) $(INCLUDES) $(AM_CPPFLAGS) \
|
||||
$(CPPFLAGS) $(AM_CFLAGS) $(CFLAGS)
|
||||
LTCOMPILE = $(LIBTOOL) $(AM_V_lt) --tag=CC $(AM_LIBTOOLFLAGS) \
|
||||
$(LIBTOOLFLAGS) --mode=compile $(CC) $(DEFS) \
|
||||
$(DEFAULT_INCLUDES) $(INCLUDES) $(AM_CPPFLAGS) $(CPPFLAGS) \
|
||||
$(AM_CFLAGS) $(CFLAGS)
|
||||
AM_V_CC = $(am__v_CC_@AM_V@)
|
||||
am__v_CC_ = $(am__v_CC_@AM_DEFAULT_V@)
|
||||
am__v_CC_0 = @echo " CC " $@;
|
||||
am__v_CC_1 =
|
||||
CCLD = $(CC)
|
||||
LINK = $(LIBTOOL) $(AM_V_lt) --tag=CC $(AM_LIBTOOLFLAGS) \
|
||||
$(LIBTOOLFLAGS) --mode=link $(CCLD) $(AM_CFLAGS) $(CFLAGS) \
|
||||
$(AM_LDFLAGS) $(LDFLAGS) -o $@
|
||||
AM_V_CCLD = $(am__v_CCLD_@AM_V@)
|
||||
am__v_CCLD_ = $(am__v_CCLD_@AM_DEFAULT_V@)
|
||||
am__v_CCLD_0 = @echo " CCLD " $@;
|
||||
am__v_CCLD_1 =
|
||||
SOURCES = $(gf_example_1_SOURCES) $(gf_example_2_SOURCES) \
|
||||
$(gf_example_3_SOURCES) $(gf_example_4_SOURCES) \
|
||||
$(gf_example_5_SOURCES) $(gf_example_6_SOURCES) \
|
||||
$(gf_example_7_SOURCES)
|
||||
DIST_SOURCES = $(gf_example_1_SOURCES) $(gf_example_2_SOURCES) \
|
||||
$(gf_example_3_SOURCES) $(gf_example_4_SOURCES) \
|
||||
$(gf_example_5_SOURCES) $(gf_example_6_SOURCES) \
|
||||
$(gf_example_7_SOURCES)
|
||||
am__can_run_installinfo = \
|
||||
case $$AM_UPDATE_INFO_DIR in \
|
||||
n|no|NO) false;; \
|
||||
*) (install-info --version) >/dev/null 2>&1;; \
|
||||
esac
|
||||
am__tagged_files = $(HEADERS) $(SOURCES) $(TAGS_FILES) $(LISP)
|
||||
# Read a list of newline-separated strings from the standard input,
|
||||
# and print each of them once, without duplicates. Input order is
|
||||
# *not* preserved.
|
||||
am__uniquify_input = $(AWK) '\
|
||||
BEGIN { nonempty = 0; } \
|
||||
{ items[$$0] = 1; nonempty = 1; } \
|
||||
END { if (nonempty) { for (i in items) print i; }; } \
|
||||
'
|
||||
# Make sure the list of sources is unique. This is necessary because,
|
||||
# e.g., the same source file might be shared among _SOURCES variables
|
||||
# for different programs/libraries.
|
||||
am__define_uniq_tagged_files = \
|
||||
list='$(am__tagged_files)'; \
|
||||
unique=`for i in $$list; do \
|
||||
if test -f "$$i"; then echo $$i; else echo $(srcdir)/$$i; fi; \
|
||||
done | $(am__uniquify_input)`
|
||||
ETAGS = etags
|
||||
CTAGS = ctags
|
||||
DISTFILES = $(DIST_COMMON) $(DIST_SOURCES) $(TEXINFOS) $(EXTRA_DIST)
|
||||
ACLOCAL = @ACLOCAL@
|
||||
AMTAR = @AMTAR@
|
||||
AM_DEFAULT_VERBOSITY = @AM_DEFAULT_VERBOSITY@
|
||||
AR = @AR@
|
||||
AUTOCONF = @AUTOCONF@
|
||||
AUTOHEADER = @AUTOHEADER@
|
||||
AUTOMAKE = @AUTOMAKE@
|
||||
AWK = @AWK@
|
||||
CC = @CC@
|
||||
CCDEPMODE = @CCDEPMODE@
|
||||
CFLAGS = @CFLAGS@
|
||||
CPP = @CPP@
|
||||
CPPFLAGS = @CPPFLAGS@
|
||||
CYGPATH_W = @CYGPATH_W@
|
||||
DEFS = @DEFS@
|
||||
DEPDIR = @DEPDIR@
|
||||
DLLTOOL = @DLLTOOL@
|
||||
DSYMUTIL = @DSYMUTIL@
|
||||
DUMPBIN = @DUMPBIN@
|
||||
ECHO_C = @ECHO_C@
|
||||
ECHO_N = @ECHO_N@
|
||||
ECHO_T = @ECHO_T@
|
||||
EGREP = @EGREP@
|
||||
EXEEXT = @EXEEXT@
|
||||
FGREP = @FGREP@
|
||||
GREP = @GREP@
|
||||
INSTALL = @INSTALL@
|
||||
INSTALL_DATA = @INSTALL_DATA@
|
||||
INSTALL_PROGRAM = @INSTALL_PROGRAM@
|
||||
INSTALL_SCRIPT = @INSTALL_SCRIPT@
|
||||
INSTALL_STRIP_PROGRAM = @INSTALL_STRIP_PROGRAM@
|
||||
LD = @LD@
|
||||
LDFLAGS = @LDFLAGS@
|
||||
LIBOBJS = @LIBOBJS@
|
||||
LIBS = @LIBS@
|
||||
LIBTOOL = @LIBTOOL@
|
||||
LIPO = @LIPO@
|
||||
LN_S = @LN_S@
|
||||
LTLIBOBJS = @LTLIBOBJS@
|
||||
MAINT = @MAINT@
|
||||
MAKEINFO = @MAKEINFO@
|
||||
MANIFEST_TOOL = @MANIFEST_TOOL@
|
||||
MKDIR_P = @MKDIR_P@
|
||||
NM = @NM@
|
||||
NMEDIT = @NMEDIT@
|
||||
OBJDUMP = @OBJDUMP@
|
||||
OBJEXT = @OBJEXT@
|
||||
OTOOL = @OTOOL@
|
||||
OTOOL64 = @OTOOL64@
|
||||
PACKAGE = @PACKAGE@
|
||||
PACKAGE_BUGREPORT = @PACKAGE_BUGREPORT@
|
||||
PACKAGE_NAME = @PACKAGE_NAME@
|
||||
PACKAGE_STRING = @PACKAGE_STRING@
|
||||
PACKAGE_TARNAME = @PACKAGE_TARNAME@
|
||||
PACKAGE_URL = @PACKAGE_URL@
|
||||
PACKAGE_VERSION = @PACKAGE_VERSION@
|
||||
PATH_SEPARATOR = @PATH_SEPARATOR@
|
||||
RANLIB = @RANLIB@
|
||||
SED = @SED@
|
||||
SET_MAKE = @SET_MAKE@
|
||||
SHELL = @SHELL@
|
||||
SIMD_FLAGS = @SIMD_FLAGS@
|
||||
STRIP = @STRIP@
|
||||
VERSION = @VERSION@
|
||||
abs_builddir = @abs_builddir@
|
||||
abs_srcdir = @abs_srcdir@
|
||||
abs_top_builddir = @abs_top_builddir@
|
||||
abs_top_srcdir = @abs_top_srcdir@
|
||||
ac_ct_AR = @ac_ct_AR@
|
||||
ac_ct_CC = @ac_ct_CC@
|
||||
ac_ct_DUMPBIN = @ac_ct_DUMPBIN@
|
||||
am__include = @am__include@
|
||||
am__leading_dot = @am__leading_dot@
|
||||
am__quote = @am__quote@
|
||||
am__tar = @am__tar@
|
||||
am__untar = @am__untar@
|
||||
bindir = @bindir@
|
||||
build = @build@
|
||||
build_alias = @build_alias@
|
||||
build_cpu = @build_cpu@
|
||||
build_os = @build_os@
|
||||
build_vendor = @build_vendor@
|
||||
builddir = @builddir@
|
||||
datadir = @datadir@
|
||||
datarootdir = @datarootdir@
|
||||
docdir = @docdir@
|
||||
dvidir = @dvidir@
|
||||
exec_prefix = @exec_prefix@
|
||||
host = @host@
|
||||
host_alias = @host_alias@
|
||||
host_cpu = @host_cpu@
|
||||
host_os = @host_os@
|
||||
host_vendor = @host_vendor@
|
||||
htmldir = @htmldir@
|
||||
includedir = @includedir@
|
||||
infodir = @infodir@
|
||||
install_sh = @install_sh@
|
||||
libdir = @libdir@
|
||||
libexecdir = @libexecdir@
|
||||
localedir = @localedir@
|
||||
localstatedir = @localstatedir@
|
||||
mandir = @mandir@
|
||||
mkdir_p = @mkdir_p@
|
||||
oldincludedir = @oldincludedir@
|
||||
pdfdir = @pdfdir@
|
||||
prefix = @prefix@
|
||||
program_transform_name = @program_transform_name@
|
||||
psdir = @psdir@
|
||||
sbindir = @sbindir@
|
||||
sharedstatedir = @sharedstatedir@
|
||||
srcdir = @srcdir@
|
||||
sysconfdir = @sysconfdir@
|
||||
target_alias = @target_alias@
|
||||
top_build_prefix = @top_build_prefix@
|
||||
top_builddir = @top_builddir@
|
||||
top_srcdir = @top_srcdir@
|
||||
INCLUDES = -I./ -I../include
|
||||
AM_CFLAGS = -O3 $(SIMD_FLAGS) -fPIC $(INCLUDES)
|
||||
gf_example_1_SOURCES = gf_example_1.c
|
||||
#gf_example_1_LDFLAGS = -lgf_complete
|
||||
gf_example_1_LDADD = ../src/libgf_complete.la
|
||||
gf_example_2_SOURCES = gf_example_2.c
|
||||
#gf_example_2_LDFLAGS = -lgf_complete
|
||||
gf_example_2_LDADD = ../src/libgf_complete.la
|
||||
gf_example_3_SOURCES = gf_example_3.c
|
||||
#gf_example_3_LDFLAGS = -lgf_complete
|
||||
gf_example_3_LDADD = ../src/libgf_complete.la
|
||||
gf_example_4_SOURCES = gf_example_4.c
|
||||
#gf_example_4_LDFLAGS = -lgf_complete
|
||||
gf_example_4_LDADD = ../src/libgf_complete.la
|
||||
gf_example_5_SOURCES = gf_example_5.c
|
||||
#gf_example_5_LDFLAGS = -lgf_complete
|
||||
gf_example_5_LDADD = ../src/libgf_complete.la
|
||||
gf_example_6_SOURCES = gf_example_6.c
|
||||
#gf_example_6_LDFLAGS = -lgf_complete
|
||||
gf_example_6_LDADD = ../src/libgf_complete.la
|
||||
gf_example_7_SOURCES = gf_example_7.c
|
||||
#gf_example_7_LDFLAGS = -lgf_complete
|
||||
gf_example_7_LDADD = ../src/libgf_complete.la
|
||||
all: all-am
|
||||
|
||||
.SUFFIXES:
|
||||
.SUFFIXES: .c .lo .o .obj
|
||||
$(srcdir)/Makefile.in: @MAINTAINER_MODE_TRUE@ $(srcdir)/Makefile.am $(am__configure_deps)
|
||||
@for dep in $?; do \
|
||||
case '$(am__configure_deps)' in \
|
||||
*$$dep*) \
|
||||
( cd $(top_builddir) && $(MAKE) $(AM_MAKEFLAGS) am--refresh ) \
|
||||
&& { if test -f $@; then exit 0; else break; fi; }; \
|
||||
exit 1;; \
|
||||
esac; \
|
||||
done; \
|
||||
echo ' cd $(top_srcdir) && $(AUTOMAKE) --gnu examples/Makefile'; \
|
||||
$(am__cd) $(top_srcdir) && \
|
||||
$(AUTOMAKE) --gnu examples/Makefile
|
||||
.PRECIOUS: Makefile
|
||||
Makefile: $(srcdir)/Makefile.in $(top_builddir)/config.status
|
||||
@case '$?' in \
|
||||
*config.status*) \
|
||||
cd $(top_builddir) && $(MAKE) $(AM_MAKEFLAGS) am--refresh;; \
|
||||
*) \
|
||||
echo ' cd $(top_builddir) && $(SHELL) ./config.status $(subdir)/$@ $(am__depfiles_maybe)'; \
|
||||
cd $(top_builddir) && $(SHELL) ./config.status $(subdir)/$@ $(am__depfiles_maybe);; \
|
||||
esac;
|
||||
|
||||
$(top_builddir)/config.status: $(top_srcdir)/configure $(CONFIG_STATUS_DEPENDENCIES)
|
||||
cd $(top_builddir) && $(MAKE) $(AM_MAKEFLAGS) am--refresh
|
||||
|
||||
$(top_srcdir)/configure: @MAINTAINER_MODE_TRUE@ $(am__configure_deps)
|
||||
cd $(top_builddir) && $(MAKE) $(AM_MAKEFLAGS) am--refresh
|
||||
$(ACLOCAL_M4): @MAINTAINER_MODE_TRUE@ $(am__aclocal_m4_deps)
|
||||
cd $(top_builddir) && $(MAKE) $(AM_MAKEFLAGS) am--refresh
|
||||
$(am__aclocal_m4_deps):
|
||||
install-binPROGRAMS: $(bin_PROGRAMS)
|
||||
@$(NORMAL_INSTALL)
|
||||
@list='$(bin_PROGRAMS)'; test -n "$(bindir)" || list=; \
|
||||
if test -n "$$list"; then \
|
||||
echo " $(MKDIR_P) '$(DESTDIR)$(bindir)'"; \
|
||||
$(MKDIR_P) "$(DESTDIR)$(bindir)" || exit 1; \
|
||||
fi; \
|
||||
for p in $$list; do echo "$$p $$p"; done | \
|
||||
sed 's/$(EXEEXT)$$//' | \
|
||||
while read p p1; do if test -f $$p \
|
||||
|| test -f $$p1 \
|
||||
; then echo "$$p"; echo "$$p"; else :; fi; \
|
||||
done | \
|
||||
sed -e 'p;s,.*/,,;n;h' \
|
||||
-e 's|.*|.|' \
|
||||
-e 'p;x;s,.*/,,;s/$(EXEEXT)$$//;$(transform);s/$$/$(EXEEXT)/' | \
|
||||
sed 'N;N;N;s,\n, ,g' | \
|
||||
$(AWK) 'BEGIN { files["."] = ""; dirs["."] = 1 } \
|
||||
{ d=$$3; if (dirs[d] != 1) { print "d", d; dirs[d] = 1 } \
|
||||
if ($$2 == $$4) files[d] = files[d] " " $$1; \
|
||||
else { print "f", $$3 "/" $$4, $$1; } } \
|
||||
END { for (d in files) print "f", d, files[d] }' | \
|
||||
while read type dir files; do \
|
||||
if test "$$dir" = .; then dir=; else dir=/$$dir; fi; \
|
||||
test -z "$$files" || { \
|
||||
echo " $(INSTALL_PROGRAM_ENV) $(LIBTOOL) $(AM_LIBTOOLFLAGS) $(LIBTOOLFLAGS) --mode=install $(INSTALL_PROGRAM) $$files '$(DESTDIR)$(bindir)$$dir'"; \
|
||||
$(INSTALL_PROGRAM_ENV) $(LIBTOOL) $(AM_LIBTOOLFLAGS) $(LIBTOOLFLAGS) --mode=install $(INSTALL_PROGRAM) $$files "$(DESTDIR)$(bindir)$$dir" || exit $$?; \
|
||||
} \
|
||||
; done
|
||||
|
||||
uninstall-binPROGRAMS:
|
||||
@$(NORMAL_UNINSTALL)
|
||||
@list='$(bin_PROGRAMS)'; test -n "$(bindir)" || list=; \
|
||||
files=`for p in $$list; do echo "$$p"; done | \
|
||||
sed -e 'h;s,^.*/,,;s/$(EXEEXT)$$//;$(transform)' \
|
||||
-e 's/$$/$(EXEEXT)/' \
|
||||
`; \
|
||||
test -n "$$list" || exit 0; \
|
||||
echo " ( cd '$(DESTDIR)$(bindir)' && rm -f" $$files ")"; \
|
||||
cd "$(DESTDIR)$(bindir)" && rm -f $$files
|
||||
|
||||
clean-binPROGRAMS:
|
||||
@list='$(bin_PROGRAMS)'; test -n "$$list" || exit 0; \
|
||||
echo " rm -f" $$list; \
|
||||
rm -f $$list || exit $$?; \
|
||||
test -n "$(EXEEXT)" || exit 0; \
|
||||
list=`for p in $$list; do echo "$$p"; done | sed 's/$(EXEEXT)$$//'`; \
|
||||
echo " rm -f" $$list; \
|
||||
rm -f $$list
|
||||
|
||||
gf_example_1$(EXEEXT): $(gf_example_1_OBJECTS) $(gf_example_1_DEPENDENCIES) $(EXTRA_gf_example_1_DEPENDENCIES)
|
||||
@rm -f gf_example_1$(EXEEXT)
|
||||
$(AM_V_CCLD)$(LINK) $(gf_example_1_OBJECTS) $(gf_example_1_LDADD) $(LIBS)
|
||||
|
||||
gf_example_2$(EXEEXT): $(gf_example_2_OBJECTS) $(gf_example_2_DEPENDENCIES) $(EXTRA_gf_example_2_DEPENDENCIES)
|
||||
@rm -f gf_example_2$(EXEEXT)
|
||||
$(AM_V_CCLD)$(LINK) $(gf_example_2_OBJECTS) $(gf_example_2_LDADD) $(LIBS)
|
||||
|
||||
gf_example_3$(EXEEXT): $(gf_example_3_OBJECTS) $(gf_example_3_DEPENDENCIES) $(EXTRA_gf_example_3_DEPENDENCIES)
|
||||
@rm -f gf_example_3$(EXEEXT)
|
||||
$(AM_V_CCLD)$(LINK) $(gf_example_3_OBJECTS) $(gf_example_3_LDADD) $(LIBS)
|
||||
|
||||
gf_example_4$(EXEEXT): $(gf_example_4_OBJECTS) $(gf_example_4_DEPENDENCIES) $(EXTRA_gf_example_4_DEPENDENCIES)
|
||||
@rm -f gf_example_4$(EXEEXT)
|
||||
$(AM_V_CCLD)$(LINK) $(gf_example_4_OBJECTS) $(gf_example_4_LDADD) $(LIBS)
|
||||
|
||||
gf_example_5$(EXEEXT): $(gf_example_5_OBJECTS) $(gf_example_5_DEPENDENCIES) $(EXTRA_gf_example_5_DEPENDENCIES)
|
||||
@rm -f gf_example_5$(EXEEXT)
|
||||
$(AM_V_CCLD)$(LINK) $(gf_example_5_OBJECTS) $(gf_example_5_LDADD) $(LIBS)
|
||||
|
||||
gf_example_6$(EXEEXT): $(gf_example_6_OBJECTS) $(gf_example_6_DEPENDENCIES) $(EXTRA_gf_example_6_DEPENDENCIES)
|
||||
@rm -f gf_example_6$(EXEEXT)
|
||||
$(AM_V_CCLD)$(LINK) $(gf_example_6_OBJECTS) $(gf_example_6_LDADD) $(LIBS)
|
||||
|
||||
gf_example_7$(EXEEXT): $(gf_example_7_OBJECTS) $(gf_example_7_DEPENDENCIES) $(EXTRA_gf_example_7_DEPENDENCIES)
|
||||
@rm -f gf_example_7$(EXEEXT)
|
||||
$(AM_V_CCLD)$(LINK) $(gf_example_7_OBJECTS) $(gf_example_7_LDADD) $(LIBS)
|
||||
|
||||
mostlyclean-compile:
|
||||
-rm -f *.$(OBJEXT)
|
||||
|
||||
distclean-compile:
|
||||
-rm -f *.tab.c
|
||||
|
||||
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/gf_example_1.Po@am__quote@
|
||||
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/gf_example_2.Po@am__quote@
|
||||
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/gf_example_3.Po@am__quote@
|
||||
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/gf_example_4.Po@am__quote@
|
||||
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/gf_example_5.Po@am__quote@
|
||||
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/gf_example_6.Po@am__quote@
|
||||
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/gf_example_7.Po@am__quote@
|
||||
|
||||
.c.o:
|
||||
@am__fastdepCC_TRUE@ $(AM_V_CC)$(COMPILE) -MT $@ -MD -MP -MF $(DEPDIR)/$*.Tpo -c -o $@ $<
|
||||
@am__fastdepCC_TRUE@ $(AM_V_at)$(am__mv) $(DEPDIR)/$*.Tpo $(DEPDIR)/$*.Po
|
||||
@AMDEP_TRUE@@am__fastdepCC_FALSE@ $(AM_V_CC)source='$<' object='$@' libtool=no @AMDEPBACKSLASH@
|
||||
@AMDEP_TRUE@@am__fastdepCC_FALSE@ DEPDIR=$(DEPDIR) $(CCDEPMODE) $(depcomp) @AMDEPBACKSLASH@
|
||||
@am__fastdepCC_FALSE@ $(AM_V_CC@am__nodep@)$(COMPILE) -c -o $@ $<
|
||||
|
||||
.c.obj:
|
||||
@am__fastdepCC_TRUE@ $(AM_V_CC)$(COMPILE) -MT $@ -MD -MP -MF $(DEPDIR)/$*.Tpo -c -o $@ `$(CYGPATH_W) '$<'`
|
||||
@am__fastdepCC_TRUE@ $(AM_V_at)$(am__mv) $(DEPDIR)/$*.Tpo $(DEPDIR)/$*.Po
|
||||
@AMDEP_TRUE@@am__fastdepCC_FALSE@ $(AM_V_CC)source='$<' object='$@' libtool=no @AMDEPBACKSLASH@
|
||||
@AMDEP_TRUE@@am__fastdepCC_FALSE@ DEPDIR=$(DEPDIR) $(CCDEPMODE) $(depcomp) @AMDEPBACKSLASH@
|
||||
@am__fastdepCC_FALSE@ $(AM_V_CC@am__nodep@)$(COMPILE) -c -o $@ `$(CYGPATH_W) '$<'`
|
||||
|
||||
.c.lo:
|
||||
@am__fastdepCC_TRUE@ $(AM_V_CC)$(LTCOMPILE) -MT $@ -MD -MP -MF $(DEPDIR)/$*.Tpo -c -o $@ $<
|
||||
@am__fastdepCC_TRUE@ $(AM_V_at)$(am__mv) $(DEPDIR)/$*.Tpo $(DEPDIR)/$*.Plo
|
||||
@AMDEP_TRUE@@am__fastdepCC_FALSE@ $(AM_V_CC)source='$<' object='$@' libtool=yes @AMDEPBACKSLASH@
|
||||
@AMDEP_TRUE@@am__fastdepCC_FALSE@ DEPDIR=$(DEPDIR) $(CCDEPMODE) $(depcomp) @AMDEPBACKSLASH@
|
||||
@am__fastdepCC_FALSE@ $(AM_V_CC@am__nodep@)$(LTCOMPILE) -c -o $@ $<
|
||||
|
||||
mostlyclean-libtool:
|
||||
-rm -f *.lo
|
||||
|
||||
clean-libtool:
|
||||
-rm -rf .libs _libs
|
||||
|
||||
ID: $(am__tagged_files)
|
||||
$(am__define_uniq_tagged_files); mkid -fID $$unique
|
||||
tags: tags-am
|
||||
TAGS: tags
|
||||
|
||||
tags-am: $(TAGS_DEPENDENCIES) $(am__tagged_files)
|
||||
set x; \
|
||||
here=`pwd`; \
|
||||
$(am__define_uniq_tagged_files); \
|
||||
shift; \
|
||||
if test -z "$(ETAGS_ARGS)$$*$$unique"; then :; else \
|
||||
test -n "$$unique" || unique=$$empty_fix; \
|
||||
if test $$# -gt 0; then \
|
||||
$(ETAGS) $(ETAGSFLAGS) $(AM_ETAGSFLAGS) $(ETAGS_ARGS) \
|
||||
"$$@" $$unique; \
|
||||
else \
|
||||
$(ETAGS) $(ETAGSFLAGS) $(AM_ETAGSFLAGS) $(ETAGS_ARGS) \
|
||||
$$unique; \
|
||||
fi; \
|
||||
fi
|
||||
ctags: ctags-am
|
||||
|
||||
CTAGS: ctags
|
||||
ctags-am: $(TAGS_DEPENDENCIES) $(am__tagged_files)
|
||||
$(am__define_uniq_tagged_files); \
|
||||
test -z "$(CTAGS_ARGS)$$unique" \
|
||||
|| $(CTAGS) $(CTAGSFLAGS) $(AM_CTAGSFLAGS) $(CTAGS_ARGS) \
|
||||
$$unique
|
||||
|
||||
GTAGS:
|
||||
here=`$(am__cd) $(top_builddir) && pwd` \
|
||||
&& $(am__cd) $(top_srcdir) \
|
||||
&& gtags -i $(GTAGS_ARGS) "$$here"
|
||||
cscopelist: cscopelist-am
|
||||
|
||||
cscopelist-am: $(am__tagged_files)
|
||||
list='$(am__tagged_files)'; \
|
||||
case "$(srcdir)" in \
|
||||
[\\/]* | ?:[\\/]*) sdir="$(srcdir)" ;; \
|
||||
*) sdir=$(subdir)/$(srcdir) ;; \
|
||||
esac; \
|
||||
for i in $$list; do \
|
||||
if test -f "$$i"; then \
|
||||
echo "$(subdir)/$$i"; \
|
||||
else \
|
||||
echo "$$sdir/$$i"; \
|
||||
fi; \
|
||||
done >> $(top_builddir)/cscope.files
|
||||
|
||||
distclean-tags:
|
||||
-rm -f TAGS ID GTAGS GRTAGS GSYMS GPATH tags
|
||||
|
||||
distdir: $(DISTFILES)
|
||||
@srcdirstrip=`echo "$(srcdir)" | sed 's/[].[^$$\\*]/\\\\&/g'`; \
|
||||
topsrcdirstrip=`echo "$(top_srcdir)" | sed 's/[].[^$$\\*]/\\\\&/g'`; \
|
||||
list='$(DISTFILES)'; \
|
||||
dist_files=`for file in $$list; do echo $$file; done | \
|
||||
sed -e "s|^$$srcdirstrip/||;t" \
|
||||
-e "s|^$$topsrcdirstrip/|$(top_builddir)/|;t"`; \
|
||||
case $$dist_files in \
|
||||
*/*) $(MKDIR_P) `echo "$$dist_files" | \
|
||||
sed '/\//!d;s|^|$(distdir)/|;s,/[^/]*$$,,' | \
|
||||
sort -u` ;; \
|
||||
esac; \
|
||||
for file in $$dist_files; do \
|
||||
if test -f $$file || test -d $$file; then d=.; else d=$(srcdir); fi; \
|
||||
if test -d $$d/$$file; then \
|
||||
dir=`echo "/$$file" | sed -e 's,/[^/]*$$,,'`; \
|
||||
if test -d "$(distdir)/$$file"; then \
|
||||
find "$(distdir)/$$file" -type d ! -perm -700 -exec chmod u+rwx {} \;; \
|
||||
fi; \
|
||||
if test -d $(srcdir)/$$file && test $$d != $(srcdir); then \
|
||||
cp -fpR $(srcdir)/$$file "$(distdir)$$dir" || exit 1; \
|
||||
find "$(distdir)/$$file" -type d ! -perm -700 -exec chmod u+rwx {} \;; \
|
||||
fi; \
|
||||
cp -fpR $$d/$$file "$(distdir)$$dir" || exit 1; \
|
||||
else \
|
||||
test -f "$(distdir)/$$file" \
|
||||
|| cp -p $$d/$$file "$(distdir)/$$file" \
|
||||
|| exit 1; \
|
||||
fi; \
|
||||
done
|
||||
check-am: all-am
|
||||
check: check-am
|
||||
all-am: Makefile $(PROGRAMS)
|
||||
installdirs:
|
||||
for dir in "$(DESTDIR)$(bindir)"; do \
|
||||
test -z "$$dir" || $(MKDIR_P) "$$dir"; \
|
||||
done
|
||||
install: install-am
|
||||
install-exec: install-exec-am
|
||||
install-data: install-data-am
|
||||
uninstall: uninstall-am
|
||||
|
||||
install-am: all-am
|
||||
@$(MAKE) $(AM_MAKEFLAGS) install-exec-am install-data-am
|
||||
|
||||
installcheck: installcheck-am
|
||||
install-strip:
|
||||
if test -z '$(STRIP)'; then \
|
||||
$(MAKE) $(AM_MAKEFLAGS) INSTALL_PROGRAM="$(INSTALL_STRIP_PROGRAM)" \
|
||||
install_sh_PROGRAM="$(INSTALL_STRIP_PROGRAM)" INSTALL_STRIP_FLAG=-s \
|
||||
install; \
|
||||
else \
|
||||
$(MAKE) $(AM_MAKEFLAGS) INSTALL_PROGRAM="$(INSTALL_STRIP_PROGRAM)" \
|
||||
install_sh_PROGRAM="$(INSTALL_STRIP_PROGRAM)" INSTALL_STRIP_FLAG=-s \
|
||||
"INSTALL_PROGRAM_ENV=STRIPPROG='$(STRIP)'" install; \
|
||||
fi
|
||||
mostlyclean-generic:
|
||||
|
||||
clean-generic:
|
||||
|
||||
distclean-generic:
|
||||
-test -z "$(CONFIG_CLEAN_FILES)" || rm -f $(CONFIG_CLEAN_FILES)
|
||||
-test . = "$(srcdir)" || test -z "$(CONFIG_CLEAN_VPATH_FILES)" || rm -f $(CONFIG_CLEAN_VPATH_FILES)
|
||||
|
||||
maintainer-clean-generic:
|
||||
@echo "This command is intended for maintainers to use"
|
||||
@echo "it deletes files that may require special tools to rebuild."
|
||||
clean: clean-am
|
||||
|
||||
clean-am: clean-binPROGRAMS clean-generic clean-libtool mostlyclean-am
|
||||
|
||||
distclean: distclean-am
|
||||
-rm -rf ./$(DEPDIR)
|
||||
-rm -f Makefile
|
||||
distclean-am: clean-am distclean-compile distclean-generic \
|
||||
distclean-tags
|
||||
|
||||
dvi: dvi-am
|
||||
|
||||
dvi-am:
|
||||
|
||||
html: html-am
|
||||
|
||||
html-am:
|
||||
|
||||
info: info-am
|
||||
|
||||
info-am:
|
||||
|
||||
install-data-am:
|
||||
|
||||
install-dvi: install-dvi-am
|
||||
|
||||
install-dvi-am:
|
||||
|
||||
install-exec-am: install-binPROGRAMS
|
||||
|
||||
install-html: install-html-am
|
||||
|
||||
install-html-am:
|
||||
|
||||
install-info: install-info-am
|
||||
|
||||
install-info-am:
|
||||
|
||||
install-man:
|
||||
|
||||
install-pdf: install-pdf-am
|
||||
|
||||
install-pdf-am:
|
||||
|
||||
install-ps: install-ps-am
|
||||
|
||||
install-ps-am:
|
||||
|
||||
installcheck-am:
|
||||
|
||||
maintainer-clean: maintainer-clean-am
|
||||
-rm -rf ./$(DEPDIR)
|
||||
-rm -f Makefile
|
||||
maintainer-clean-am: distclean-am maintainer-clean-generic
|
||||
|
||||
mostlyclean: mostlyclean-am
|
||||
|
||||
mostlyclean-am: mostlyclean-compile mostlyclean-generic \
|
||||
mostlyclean-libtool
|
||||
|
||||
pdf: pdf-am
|
||||
|
||||
pdf-am:
|
||||
|
||||
ps: ps-am
|
||||
|
||||
ps-am:
|
||||
|
||||
uninstall-am: uninstall-binPROGRAMS
|
||||
|
||||
.MAKE: install-am install-strip
|
||||
|
||||
.PHONY: CTAGS GTAGS TAGS all all-am check check-am clean \
|
||||
clean-binPROGRAMS clean-generic clean-libtool cscopelist-am \
|
||||
ctags ctags-am distclean distclean-compile distclean-generic \
|
||||
distclean-libtool distclean-tags distdir dvi dvi-am html \
|
||||
html-am info info-am install install-am install-binPROGRAMS \
|
||||
install-data install-data-am install-dvi install-dvi-am \
|
||||
install-exec install-exec-am install-html install-html-am \
|
||||
install-info install-info-am install-man install-pdf \
|
||||
install-pdf-am install-ps install-ps-am install-strip \
|
||||
installcheck installcheck-am installdirs maintainer-clean \
|
||||
maintainer-clean-generic mostlyclean mostlyclean-compile \
|
||||
mostlyclean-generic mostlyclean-libtool pdf pdf-am ps ps-am \
|
||||
tags tags-am uninstall uninstall-am uninstall-binPROGRAMS
|
||||
|
||||
|
||||
# Tell versions [3.59,3.63) of GNU make to not export all variables.
|
||||
# Otherwise a system limit (for SysV at least) may be exceeded.
|
||||
.NOEXPORT:
|
|
@ -1,92 +0,0 @@
|
|||
/* include/config.h.in. Generated from configure.ac by autoheader. */
|
||||
|
||||
/* Support Altivec instructions */
|
||||
#undef HAVE_ALTIVEC
|
||||
|
||||
/* Support AVX (Advanced Vector Extensions) instructions */
|
||||
#undef HAVE_AVX
|
||||
|
||||
/* Define to 1 if you have the <dlfcn.h> header file. */
|
||||
#undef HAVE_DLFCN_H
|
||||
|
||||
/* Define to 1 if you have the <inttypes.h> header file. */
|
||||
#undef HAVE_INTTYPES_H
|
||||
|
||||
/* Define to 1 if you have the <memory.h> header file. */
|
||||
#undef HAVE_MEMORY_H
|
||||
|
||||
/* Support mmx instructions */
|
||||
#undef HAVE_MMX
|
||||
|
||||
/* Support (PCLMULDQ) Carry-Free Muliplication */
|
||||
#undef HAVE_PCLMULDQ
|
||||
|
||||
/* Support SSE (Streaming SIMD Extensions) instructions */
|
||||
#undef HAVE_SSE
|
||||
|
||||
/* Support SSE2 (Streaming SIMD Extensions 2) instructions */
|
||||
#undef HAVE_SSE2
|
||||
|
||||
/* Support SSE3 (Streaming SIMD Extensions 3) instructions */
|
||||
#undef HAVE_SSE3
|
||||
|
||||
/* Support SSSE4.1 (Streaming SIMD Extensions 4.1) instructions */
|
||||
#undef HAVE_SSE4_1
|
||||
|
||||
/* Support SSSE4.2 (Streaming SIMD Extensions 4.2) instructions */
|
||||
#undef HAVE_SSE4_2
|
||||
|
||||
/* Support SSSE3 (Supplemental Streaming SIMD Extensions 3) instructions */
|
||||
#undef HAVE_SSSE3
|
||||
|
||||
/* Define to 1 if you have the <stdint.h> header file. */
|
||||
#undef HAVE_STDINT_H
|
||||
|
||||
/* Define to 1 if you have the <stdlib.h> header file. */
|
||||
#undef HAVE_STDLIB_H
|
||||
|
||||
/* Define to 1 if you have the <strings.h> header file. */
|
||||
#undef HAVE_STRINGS_H
|
||||
|
||||
/* Define to 1 if you have the <string.h> header file. */
|
||||
#undef HAVE_STRING_H
|
||||
|
||||
/* Define to 1 if you have the <sys/stat.h> header file. */
|
||||
#undef HAVE_SYS_STAT_H
|
||||
|
||||
/* Define to 1 if you have the <sys/types.h> header file. */
|
||||
#undef HAVE_SYS_TYPES_H
|
||||
|
||||
/* Define to 1 if you have the <unistd.h> header file. */
|
||||
#undef HAVE_UNISTD_H
|
||||
|
||||
/* Define to the sub-directory in which libtool stores uninstalled libraries.
|
||||
*/
|
||||
#undef LT_OBJDIR
|
||||
|
||||
/* Name of package */
|
||||
#undef PACKAGE
|
||||
|
||||
/* Define to the address where bug reports for this package should be sent. */
|
||||
#undef PACKAGE_BUGREPORT
|
||||
|
||||
/* Define to the full name of this package. */
|
||||
#undef PACKAGE_NAME
|
||||
|
||||
/* Define to the full name and version of this package. */
|
||||
#undef PACKAGE_STRING
|
||||
|
||||
/* Define to the one symbol short name of this package. */
|
||||
#undef PACKAGE_TARNAME
|
||||
|
||||
/* Define to the home page for this package. */
|
||||
#undef PACKAGE_URL
|
||||
|
||||
/* Define to the version of this package. */
|
||||
#undef PACKAGE_VERSION
|
||||
|
||||
/* Define to 1 if you have the ANSI C header files. */
|
||||
#undef STDC_HEADERS
|
||||
|
||||
/* Version number of package */
|
||||
#undef VERSION
|
|
@ -13,7 +13,12 @@
|
|||
#include <stdint.h>
|
||||
|
||||
#ifdef INTEL_SSE4
|
||||
#include <nmmintrin.h>
|
||||
#ifdef __SSE4_2__
|
||||
#include <nmmintrin.h>
|
||||
#endif
|
||||
#ifdef __SSE4_1__
|
||||
#include <smmintrin.h>
|
||||
#endif
|
||||
#endif
|
||||
|
||||
#ifdef INTEL_SSSE3
|
||||
|
@ -28,6 +33,10 @@
|
|||
#include <wmmintrin.h>
|
||||
#endif
|
||||
|
||||
#if defined(ARM_NEON)
|
||||
#include <arm_neon.h>
|
||||
#endif
|
||||
|
||||
|
||||
/* These are the different ways to perform multiplication.
|
||||
Not all are implemented for all values of w.
|
||||
|
@ -36,7 +45,7 @@
|
|||
typedef enum {GF_MULT_DEFAULT,
|
||||
GF_MULT_SHIFT,
|
||||
GF_MULT_CARRY_FREE,
|
||||
GF_MULT_CARRY_FREE_GK, //ADAM
|
||||
GF_MULT_CARRY_FREE_GK,
|
||||
GF_MULT_GROUP,
|
||||
GF_MULT_BYTWO_p,
|
||||
GF_MULT_BYTWO_b,
|
||||
|
@ -56,7 +65,9 @@ typedef enum {GF_MULT_DEFAULT,
|
|||
#define GF_REGION_DOUBLE_TABLE (0x1)
|
||||
#define GF_REGION_QUAD_TABLE (0x2)
|
||||
#define GF_REGION_LAZY (0x4)
|
||||
#define GF_REGION_SIMD (0x8)
|
||||
#define GF_REGION_SSE (0x8)
|
||||
#define GF_REGION_NOSIMD (0x10)
|
||||
#define GF_REGION_NOSSE (0x10)
|
||||
#define GF_REGION_ALTMAP (0x20)
|
||||
#define GF_REGION_CAUCHY (0x40)
|
||||
|
|
|
@ -0,0 +1,20 @@
|
|||
/*
|
||||
* GF-Complete: A Comprehensive Open Source Library for Galois Field Arithmetic
|
||||
* James S. Plank, Ethan L. Miller, Kevin M. Greenan,
|
||||
* Benjamin A. Arnold, John A. Burnum, Adam W. Disney, Allen C. McBride.
|
||||
*
|
||||
* gf_cpu.h
|
||||
*
|
||||
* Identifies whether the CPU supports SIMD instructions at runtime.
|
||||
*/
|
||||
|
||||
#pragma once
|
||||
|
||||
extern int gf_cpu_supports_intel_pclmul;
|
||||
extern int gf_cpu_supports_intel_sse4;
|
||||
extern int gf_cpu_supports_intel_ssse3;
|
||||
extern int gf_cpu_supports_intel_sse3;
|
||||
extern int gf_cpu_supports_intel_sse2;
|
||||
extern int gf_cpu_supports_arm_neon;
|
||||
|
||||
void gf_cpu_identify(void);
|
|
@ -30,8 +30,24 @@ typedef struct {
|
|||
int arg2;
|
||||
gf_t *base_gf;
|
||||
void *private;
|
||||
#ifdef DEBUG_FUNCTIONS
|
||||
const char *multiply;
|
||||
const char *divide;
|
||||
const char *inverse;
|
||||
const char *multiply_region;
|
||||
const char *extract_word;
|
||||
#endif
|
||||
} gf_internal_t;
|
||||
|
||||
#ifdef DEBUG_FUNCTIONS
|
||||
#define SET_FUNCTION(gf,method,size,func) \
|
||||
{ (gf)->method.size = (func); \
|
||||
((gf_internal_t*)(gf)->scratch)->method = #func; }
|
||||
#else
|
||||
#define SET_FUNCTION(gf,method,size,func) \
|
||||
(gf)->method.size = (func);
|
||||
#endif
|
||||
|
||||
extern int gf_w4_init (gf_t *gf);
|
||||
extern int gf_w4_scratch_size(int mult_type, int region_type, int divide_type, int arg1, int arg2);
|
||||
|
||||
|
@ -113,7 +129,7 @@ typedef enum {GF_E_MDEFDIV, /* Dev != Default && Mult == Default */
|
|||
GF_E_DIVCOMP, /* Mult == Composite && Div != Default */
|
||||
GF_E_CAUCOMP, /* Mult == Composite && Reg == CAUCHY */
|
||||
GF_E_DOUQUAD, /* Reg == DOUBLE && Reg == QUAD */
|
||||
GF_E_SSE__NO, /* Reg == SSE && Reg == NOSSE */
|
||||
GF_E_SIMD_NO, /* Reg == SIMD && Reg == NOSIMD */
|
||||
GF_E_CAUCHYB, /* Reg == CAUCHY && Other Reg */
|
||||
GF_E_CAUGT32, /* Reg == CAUCHY && w > 32*/
|
||||
GF_E_ARG1SET, /* Arg1 != 0 && Mult \notin COMPOSITE/SPLIT/GROUP */
|
||||
|
@ -129,9 +145,9 @@ typedef enum {GF_E_MDEFDIV, /* Dev != Default && Mult == Default */
|
|||
GF_E_QUAD__J, /* Reg == QUAD && other Reg */
|
||||
GF_E_LAZY__X, /* Reg == LAZY && not DOUBLE or QUAD*/
|
||||
GF_E_ALTSHIF, /* Mult == Shift && Reg == ALTMAP */
|
||||
GF_E_SSESHIF, /* Mult == Shift && Reg == SSE|NOSSE */
|
||||
GF_E_SSESHIF, /* Mult == Shift && Reg == SIMD|NOSIMD */
|
||||
GF_E_ALT_CFM, /* Mult == CARRY_FREE && Reg == ALTMAP */
|
||||
GF_E_SSE_CFM, /* Mult == CARRY_FREE && Reg == SSE|NOSSE */
|
||||
GF_E_SSE_CFM, /* Mult == CARRY_FREE && Reg == SIMD|NOSIMD */
|
||||
GF_E_PCLMULX, /* Mult == Carry_Free && No PCLMUL */
|
||||
GF_E_ALT_BY2, /* Mult == Bytwo_x && Reg == ALTMAP */
|
||||
GF_E_BY2_SSE, /* Mult == Bytwo_x && Reg == SSE && No SSE2 */
|
||||
|
@ -148,7 +164,7 @@ typedef enum {GF_E_MDEFDIV, /* Dev != Default && Mult == Default */
|
|||
GF_E_GR_AR_W, /* Mult == GROUP, either arg > w */
|
||||
GF_E_GR____J, /* Mult == GROUP, Reg == SSE|ALTMAP|NOSSE */
|
||||
GF_E_TABLE_W, /* Mult == TABLE, w too big */
|
||||
GF_E_TAB_SSE, /* Mult == TABLE, SSE|NOSSE only apply to w == 4 */
|
||||
GF_E_TAB_SSE, /* Mult == TABLE, SIMD|NOSIMD only apply to w == 4 */
|
||||
GF_E_TABSSE3, /* Mult == TABLE, Need SSSE3 for SSE */
|
||||
GF_E_TAB_ALT, /* Mult == TABLE, Reg == ALTMAP */
|
||||
GF_E_SP128AR, /* Mult == SPLIT, w=128, Bad arg1/arg2 */
|
||||
|
@ -172,7 +188,7 @@ typedef enum {GF_E_MDEFDIV, /* Dev != Default && Mult == Default */
|
|||
GF_E_SP_8__A, /* Mult == SPLIT, w=8, no ALTMAP */
|
||||
GF_E_SP_SSE3, /* Mult == SPLIT, Need SSSE3 for SSE */
|
||||
GF_E_COMP_A2, /* Mult == COMP, arg1 must be = 2 */
|
||||
GF_E_COMP_SS, /* Mult == COMP, SSE|NOSSE */
|
||||
GF_E_COMP_SS, /* Mult == COMP, SIMD|NOSIMD */
|
||||
GF_E_COMP__W, /* Mult == COMP, Bad w. */
|
||||
GF_E_UNKFLAG, /* Unknown flag in create_from.... */
|
||||
GF_E_UNKNOWN, /* Unknown mult_type. */
|
||||
|
|
|
@ -0,0 +1,66 @@
|
|||
/*
|
||||
* GF-Complete: A Comprehensive Open Source Library for Galois Field Arithmetic
|
||||
* James S. Plank, Ethan L. Miller, Kevin M. Greenan,
|
||||
* Benjamin A. Arnold, John A. Burnum, Adam W. Disney, Allen C. McBride.
|
||||
*
|
||||
* gf_w16.h
|
||||
*
|
||||
* Defines and data structures for 16-bit Galois fields
|
||||
*/
|
||||
|
||||
#ifndef GF_COMPLETE_GF_W16_H
|
||||
#define GF_COMPLETE_GF_W16_H
|
||||
|
||||
#include <stdint.h>
|
||||
|
||||
#define GF_FIELD_WIDTH (16)
|
||||
#define GF_FIELD_SIZE (1 << GF_FIELD_WIDTH)
|
||||
#define GF_MULT_GROUP_SIZE GF_FIELD_SIZE-1
|
||||
|
||||
#define GF_BASE_FIELD_WIDTH (8)
|
||||
#define GF_BASE_FIELD_SIZE (1 << GF_BASE_FIELD_WIDTH)
|
||||
|
||||
struct gf_w16_logtable_data {
|
||||
uint16_t log_tbl[GF_FIELD_SIZE];
|
||||
uint16_t antilog_tbl[GF_FIELD_SIZE * 2];
|
||||
uint16_t inv_tbl[GF_FIELD_SIZE];
|
||||
uint16_t *d_antilog;
|
||||
};
|
||||
|
||||
struct gf_w16_zero_logtable_data {
|
||||
int log_tbl[GF_FIELD_SIZE];
|
||||
uint16_t _antilog_tbl[GF_FIELD_SIZE * 4];
|
||||
uint16_t *antilog_tbl;
|
||||
uint16_t inv_tbl[GF_FIELD_SIZE];
|
||||
};
|
||||
|
||||
struct gf_w16_lazytable_data {
|
||||
uint16_t log_tbl[GF_FIELD_SIZE];
|
||||
uint16_t antilog_tbl[GF_FIELD_SIZE * 2];
|
||||
uint16_t inv_tbl[GF_FIELD_SIZE];
|
||||
uint16_t *d_antilog;
|
||||
uint16_t lazytable[GF_FIELD_SIZE];
|
||||
};
|
||||
|
||||
struct gf_w16_bytwo_data {
|
||||
uint64_t prim_poly;
|
||||
uint64_t mask1;
|
||||
uint64_t mask2;
|
||||
};
|
||||
|
||||
struct gf_w16_split_8_8_data {
|
||||
uint16_t tables[3][256][256];
|
||||
};
|
||||
|
||||
struct gf_w16_group_4_4_data {
|
||||
uint16_t reduce[16];
|
||||
uint16_t shift[16];
|
||||
};
|
||||
|
||||
struct gf_w16_composite_data {
|
||||
uint8_t *mult_table;
|
||||
};
|
||||
|
||||
void gf_w16_neon_split_init(gf_t *gf);
|
||||
|
||||
#endif /* GF_COMPLETE_GF_W16_H */
|
|
@ -0,0 +1,71 @@
|
|||
/*
|
||||
* GF-Complete: A Comprehensive Open Source Library for Galois Field Arithmetic
|
||||
* James S. Plank, Ethan L. Miller, Kevin M. Greenan,
|
||||
* Benjamin A. Arnold, John A. Burnum, Adam W. Disney, Allen C. McBride.
|
||||
*
|
||||
* gf_w32.h
|
||||
*
|
||||
* Defines and data structures for 32-bit Galois fields
|
||||
*/
|
||||
|
||||
#ifndef GF_COMPLETE_GF_W32_H
|
||||
#define GF_COMPLETE_GF_W32_H
|
||||
|
||||
#include <stdint.h>
|
||||
|
||||
#define GF_FIELD_WIDTH (32)
|
||||
#define GF_FIRST_BIT ((gf_val_32_t)1 << 31)
|
||||
|
||||
#define GF_BASE_FIELD_WIDTH (16)
|
||||
#define GF_BASE_FIELD_SIZE (1 << GF_BASE_FIELD_WIDTH)
|
||||
#define GF_BASE_FIELD_GROUP_SIZE GF_BASE_FIELD_SIZE-1
|
||||
#define GF_MULTBY_TWO(p) (((p) & GF_FIRST_BIT) ? (((p) << 1) ^ h->prim_poly) : (p) << 1)
|
||||
|
||||
struct gf_split_2_32_lazy_data {
|
||||
uint32_t tables[16][4];
|
||||
uint32_t last_value;
|
||||
};
|
||||
|
||||
struct gf_w32_split_8_8_data {
|
||||
uint32_t tables[7][256][256];
|
||||
uint32_t region_tables[4][256];
|
||||
uint32_t last_value;
|
||||
};
|
||||
|
||||
struct gf_w32_group_data {
|
||||
uint32_t *reduce;
|
||||
uint32_t *shift;
|
||||
int tshift;
|
||||
uint64_t rmask;
|
||||
uint32_t *memory;
|
||||
};
|
||||
|
||||
struct gf_split_16_32_lazy_data {
|
||||
uint32_t tables[2][(1<<16)];
|
||||
uint32_t last_value;
|
||||
};
|
||||
|
||||
struct gf_split_8_32_lazy_data {
|
||||
uint32_t tables[4][256];
|
||||
uint32_t last_value;
|
||||
};
|
||||
|
||||
struct gf_split_4_32_lazy_data {
|
||||
uint32_t tables[8][16];
|
||||
uint32_t last_value;
|
||||
};
|
||||
|
||||
struct gf_w32_bytwo_data {
|
||||
uint64_t prim_poly;
|
||||
uint64_t mask1;
|
||||
uint64_t mask2;
|
||||
};
|
||||
|
||||
struct gf_w32_composite_data {
|
||||
uint16_t *log;
|
||||
uint16_t *alog;
|
||||
};
|
||||
|
||||
void gf_w32_neon_split_init(gf_t *gf);
|
||||
|
||||
#endif /* GF_COMPLETE_GF_W32_H */
|
|
@ -0,0 +1,63 @@
|
|||
/*
|
||||
* GF-Complete: A Comprehensive Open Source Library for Galois Field Arithmetic
|
||||
* James S. Plank, Ethan L. Miller, Kevin M. Greenan,
|
||||
* Benjamin A. Arnold, John A. Burnum, Adam W. Disney, Allen C. McBride.
|
||||
*
|
||||
* gf_w4.h
|
||||
*
|
||||
* Defines and data structures for 4-bit Galois fields
|
||||
*/
|
||||
|
||||
#ifndef GF_COMPLETE_GF_W4_H
|
||||
#define GF_COMPLETE_GF_W4_H
|
||||
|
||||
#include <stdint.h>
|
||||
|
||||
#define GF_FIELD_WIDTH 4
|
||||
#define GF_DOUBLE_WIDTH (GF_FIELD_WIDTH*2)
|
||||
#define GF_FIELD_SIZE (1 << GF_FIELD_WIDTH)
|
||||
#define GF_MULT_GROUP_SIZE (GF_FIELD_SIZE-1)
|
||||
|
||||
/* ------------------------------------------------------------
|
||||
JSP: Each implementation has its own data, which is allocated
|
||||
at one time as part of the handle. For that reason, it
|
||||
shouldn't be hierarchical -- i.e. one should be able to
|
||||
allocate it with one call to malloc. */
|
||||
|
||||
struct gf_logtable_data {
|
||||
uint8_t log_tbl[GF_FIELD_SIZE];
|
||||
uint8_t antilog_tbl[GF_FIELD_SIZE * 2];
|
||||
uint8_t *antilog_tbl_div;
|
||||
};
|
||||
|
||||
struct gf_single_table_data {
|
||||
uint8_t mult[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
uint8_t div[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
};
|
||||
|
||||
struct gf_double_table_data {
|
||||
uint8_t div[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
uint8_t mult[GF_FIELD_SIZE][GF_FIELD_SIZE*GF_FIELD_SIZE];
|
||||
};
|
||||
struct gf_quad_table_data {
|
||||
uint8_t div[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
uint16_t mult[GF_FIELD_SIZE][(1<<16)];
|
||||
};
|
||||
|
||||
struct gf_quad_table_lazy_data {
|
||||
uint8_t div[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
uint8_t smult[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
uint16_t mult[(1 << 16)];
|
||||
};
|
||||
|
||||
struct gf_bytwo_data {
|
||||
uint64_t prim_poly;
|
||||
uint64_t mask1;
|
||||
uint64_t mask2;
|
||||
};
|
||||
|
||||
// ARM NEON init functions
|
||||
int gf_w4_neon_cfm_init(gf_t *gf);
|
||||
void gf_w4_neon_single_table_init(gf_t *gf);
|
||||
|
||||
#endif /* GF_COMPLETE_GF_W4_H */
|
|
@ -0,0 +1,50 @@
|
|||
/*
|
||||
* GF-Complete: A Comprehensive Open Source Library for Galois Field Arithmetic
|
||||
* James S. Plank, Ethan L. Miller, Kevin M. Greenan,
|
||||
* Benjamin A. Arnold, John A. Burnum, Adam W. Disney, Allen C. McBride.
|
||||
*
|
||||
* gf_w64.h
|
||||
*
|
||||
* Defines and data structures for 64-bit Galois fields
|
||||
*/
|
||||
|
||||
#ifndef GF_COMPLETE_GF_W64_H
|
||||
#define GF_COMPLETE_GF_W64_H
|
||||
|
||||
#include <stdint.h>
|
||||
|
||||
#define GF_FIELD_WIDTH (64)
|
||||
#define GF_FIRST_BIT (1ULL << 63)
|
||||
|
||||
#define GF_BASE_FIELD_WIDTH (32)
|
||||
#define GF_BASE_FIELD_SIZE (1ULL << GF_BASE_FIELD_WIDTH)
|
||||
#define GF_BASE_FIELD_GROUP_SIZE GF_BASE_FIELD_SIZE-1
|
||||
|
||||
struct gf_w64_group_data {
|
||||
uint64_t *reduce;
|
||||
uint64_t *shift;
|
||||
uint64_t *memory;
|
||||
};
|
||||
|
||||
struct gf_split_4_64_lazy_data {
|
||||
uint64_t tables[16][16];
|
||||
uint64_t last_value;
|
||||
};
|
||||
|
||||
struct gf_split_8_64_lazy_data {
|
||||
uint64_t tables[8][(1<<8)];
|
||||
uint64_t last_value;
|
||||
};
|
||||
|
||||
struct gf_split_16_64_lazy_data {
|
||||
uint64_t tables[4][(1<<16)];
|
||||
uint64_t last_value;
|
||||
};
|
||||
|
||||
struct gf_split_8_8_data {
|
||||
uint64_t tables[15][256][256];
|
||||
};
|
||||
|
||||
void gf_w64_neon_split_init(gf_t *gf);
|
||||
|
||||
#endif /* GF_COMPLETE_GF_W64_H */
|
|
@ -0,0 +1,99 @@
|
|||
/*
|
||||
* GF-Complete: A Comprehensive Open Source Library for Galois Field Arithmetic
|
||||
* James S. Plank, Ethan L. Miller, Kevin M. Greenan,
|
||||
* Benjamin A. Arnold, John A. Burnum, Adam W. Disney, Allen C. McBride.
|
||||
*
|
||||
* gf_w8.c
|
||||
*
|
||||
* Defines and data stuctures for 8-bit Galois fields
|
||||
*/
|
||||
|
||||
#ifndef GF_COMPLETE_GF_W8_H
|
||||
#define GF_COMPLETE_GF_W8_H
|
||||
|
||||
#include "gf_int.h"
|
||||
#include <stdint.h>
|
||||
|
||||
#define GF_FIELD_WIDTH (8)
|
||||
#define GF_FIELD_SIZE (1 << GF_FIELD_WIDTH)
|
||||
#define GF_HALF_SIZE (1 << (GF_FIELD_WIDTH/2))
|
||||
#define GF_MULT_GROUP_SIZE GF_FIELD_SIZE-1
|
||||
|
||||
#define GF_BASE_FIELD_WIDTH (4)
|
||||
#define GF_BASE_FIELD_SIZE (1 << GF_BASE_FIELD_WIDTH)
|
||||
|
||||
struct gf_w8_logtable_data {
|
||||
uint8_t log_tbl[GF_FIELD_SIZE];
|
||||
uint8_t antilog_tbl[GF_FIELD_SIZE * 2];
|
||||
uint8_t inv_tbl[GF_FIELD_SIZE];
|
||||
};
|
||||
|
||||
struct gf_w8_logzero_table_data {
|
||||
short log_tbl[GF_FIELD_SIZE]; /* Make this signed, so that we can divide easily */
|
||||
uint8_t antilog_tbl[512+512+1];
|
||||
uint8_t *div_tbl;
|
||||
uint8_t *inv_tbl;
|
||||
};
|
||||
|
||||
struct gf_w8_logzero_small_table_data {
|
||||
short log_tbl[GF_FIELD_SIZE]; /* Make this signed, so that we can divide easily */
|
||||
uint8_t antilog_tbl[255*3];
|
||||
uint8_t inv_tbl[GF_FIELD_SIZE];
|
||||
uint8_t *div_tbl;
|
||||
};
|
||||
|
||||
struct gf_w8_composite_data {
|
||||
uint8_t *mult_table;
|
||||
};
|
||||
|
||||
/* Don't change the order of these relative to gf_w8_half_table_data */
|
||||
|
||||
struct gf_w8_default_data {
|
||||
uint8_t high[GF_FIELD_SIZE][GF_HALF_SIZE];
|
||||
uint8_t low[GF_FIELD_SIZE][GF_HALF_SIZE];
|
||||
uint8_t divtable[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
uint8_t multtable[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
};
|
||||
|
||||
struct gf_w8_half_table_data {
|
||||
uint8_t high[GF_FIELD_SIZE][GF_HALF_SIZE];
|
||||
uint8_t low[GF_FIELD_SIZE][GF_HALF_SIZE];
|
||||
};
|
||||
|
||||
struct gf_w8_single_table_data {
|
||||
uint8_t divtable[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
uint8_t multtable[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
};
|
||||
|
||||
struct gf_w8_double_table_data {
|
||||
uint8_t div[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
uint16_t mult[GF_FIELD_SIZE][GF_FIELD_SIZE*GF_FIELD_SIZE];
|
||||
};
|
||||
|
||||
struct gf_w8_double_table_lazy_data {
|
||||
uint8_t div[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
uint8_t smult[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
uint16_t mult[GF_FIELD_SIZE*GF_FIELD_SIZE];
|
||||
};
|
||||
|
||||
struct gf_w4_logtable_data {
|
||||
uint8_t log_tbl[GF_BASE_FIELD_SIZE];
|
||||
uint8_t antilog_tbl[GF_BASE_FIELD_SIZE * 2];
|
||||
uint8_t *antilog_tbl_div;
|
||||
};
|
||||
|
||||
struct gf_w4_single_table_data {
|
||||
uint8_t div[GF_BASE_FIELD_SIZE][GF_BASE_FIELD_SIZE];
|
||||
uint8_t mult[GF_BASE_FIELD_SIZE][GF_BASE_FIELD_SIZE];
|
||||
};
|
||||
|
||||
struct gf_w8_bytwo_data {
|
||||
uint64_t prim_poly;
|
||||
uint64_t mask1;
|
||||
uint64_t mask2;
|
||||
};
|
||||
|
||||
int gf_w8_neon_cfm_init(gf_t *gf);
|
||||
void gf_w8_neon_split_init(gf_t *gf);
|
||||
|
||||
#endif /* GF_COMPLETE_GF_W8_H */
|
527
install-sh
|
@ -1,527 +0,0 @@
|
|||
#!/bin/sh
|
||||
# install - install a program, script, or datafile
|
||||
|
||||
scriptversion=2011-11-20.07; # UTC
|
||||
|
||||
# This originates from X11R5 (mit/util/scripts/install.sh), which was
|
||||
# later released in X11R6 (xc/config/util/install.sh) with the
|
||||
# following copyright and license.
|
||||
#
|
||||
# Copyright (C) 1994 X Consortium
|
||||
#
|
||||
# Permission is hereby granted, free of charge, to any person obtaining a copy
|
||||
# of this software and associated documentation files (the "Software"), to
|
||||
# deal in the Software without restriction, including without limitation the
|
||||
# rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
|
||||
# sell copies of the Software, and to permit persons to whom the Software is
|
||||
# furnished to do so, subject to the following conditions:
|
||||
#
|
||||
# The above copyright notice and this permission notice shall be included in
|
||||
# all copies or substantial portions of the Software.
|
||||
#
|
||||
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
||||
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
||||
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
||||
# X CONSORTIUM BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN
|
||||
# AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNEC-
|
||||
# TION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
||||
#
|
||||
# Except as contained in this notice, the name of the X Consortium shall not
|
||||
# be used in advertising or otherwise to promote the sale, use or other deal-
|
||||
# ings in this Software without prior written authorization from the X Consor-
|
||||
# tium.
|
||||
#
|
||||
#
|
||||
# FSF changes to this file are in the public domain.
|
||||
#
|
||||
# Calling this script install-sh is preferred over install.sh, to prevent
|
||||
# 'make' implicit rules from creating a file called install from it
|
||||
# when there is no Makefile.
|
||||
#
|
||||
# This script is compatible with the BSD install script, but was written
|
||||
# from scratch.
|
||||
|
||||
nl='
|
||||
'
|
||||
IFS=" "" $nl"
|
||||
|
||||
# set DOITPROG to echo to test this script
|
||||
|
||||
# Don't use :- since 4.3BSD and earlier shells don't like it.
|
||||
doit=${DOITPROG-}
|
||||
if test -z "$doit"; then
|
||||
doit_exec=exec
|
||||
else
|
||||
doit_exec=$doit
|
||||
fi
|
||||
|
||||
# Put in absolute file names if you don't have them in your path;
|
||||
# or use environment vars.
|
||||
|
||||
chgrpprog=${CHGRPPROG-chgrp}
|
||||
chmodprog=${CHMODPROG-chmod}
|
||||
chownprog=${CHOWNPROG-chown}
|
||||
cmpprog=${CMPPROG-cmp}
|
||||
cpprog=${CPPROG-cp}
|
||||
mkdirprog=${MKDIRPROG-mkdir}
|
||||
mvprog=${MVPROG-mv}
|
||||
rmprog=${RMPROG-rm}
|
||||
stripprog=${STRIPPROG-strip}
|
||||
|
||||
posix_glob='?'
|
||||
initialize_posix_glob='
|
||||
test "$posix_glob" != "?" || {
|
||||
if (set -f) 2>/dev/null; then
|
||||
posix_glob=
|
||||
else
|
||||
posix_glob=:
|
||||
fi
|
||||
}
|
||||
'
|
||||
|
||||
posix_mkdir=
|
||||
|
||||
# Desired mode of installed file.
|
||||
mode=0755
|
||||
|
||||
chgrpcmd=
|
||||
chmodcmd=$chmodprog
|
||||
chowncmd=
|
||||
mvcmd=$mvprog
|
||||
rmcmd="$rmprog -f"
|
||||
stripcmd=
|
||||
|
||||
src=
|
||||
dst=
|
||||
dir_arg=
|
||||
dst_arg=
|
||||
|
||||
copy_on_change=false
|
||||
no_target_directory=
|
||||
|
||||
usage="\
|
||||
Usage: $0 [OPTION]... [-T] SRCFILE DSTFILE
|
||||
or: $0 [OPTION]... SRCFILES... DIRECTORY
|
||||
or: $0 [OPTION]... -t DIRECTORY SRCFILES...
|
||||
or: $0 [OPTION]... -d DIRECTORIES...
|
||||
|
||||
In the 1st form, copy SRCFILE to DSTFILE.
|
||||
In the 2nd and 3rd, copy all SRCFILES to DIRECTORY.
|
||||
In the 4th, create DIRECTORIES.
|
||||
|
||||
Options:
|
||||
--help display this help and exit.
|
||||
--version display version info and exit.
|
||||
|
||||
-c (ignored)
|
||||
-C install only if different (preserve the last data modification time)
|
||||
-d create directories instead of installing files.
|
||||
-g GROUP $chgrpprog installed files to GROUP.
|
||||
-m MODE $chmodprog installed files to MODE.
|
||||
-o USER $chownprog installed files to USER.
|
||||
-s $stripprog installed files.
|
||||
-t DIRECTORY install into DIRECTORY.
|
||||
-T report an error if DSTFILE is a directory.
|
||||
|
||||
Environment variables override the default commands:
|
||||
CHGRPPROG CHMODPROG CHOWNPROG CMPPROG CPPROG MKDIRPROG MVPROG
|
||||
RMPROG STRIPPROG
|
||||
"
|
||||
|
||||
while test $# -ne 0; do
|
||||
case $1 in
|
||||
-c) ;;
|
||||
|
||||
-C) copy_on_change=true;;
|
||||
|
||||
-d) dir_arg=true;;
|
||||
|
||||
-g) chgrpcmd="$chgrpprog $2"
|
||||
shift;;
|
||||
|
||||
--help) echo "$usage"; exit $?;;
|
||||
|
||||
-m) mode=$2
|
||||
case $mode in
|
||||
*' '* | *' '* | *'
|
||||
'* | *'*'* | *'?'* | *'['*)
|
||||
echo "$0: invalid mode: $mode" >&2
|
||||
exit 1;;
|
||||
esac
|
||||
shift;;
|
||||
|
||||
-o) chowncmd="$chownprog $2"
|
||||
shift;;
|
||||
|
||||
-s) stripcmd=$stripprog;;
|
||||
|
||||
-t) dst_arg=$2
|
||||
# Protect names problematic for 'test' and other utilities.
|
||||
case $dst_arg in
|
||||
-* | [=\(\)!]) dst_arg=./$dst_arg;;
|
||||
esac
|
||||
shift;;
|
||||
|
||||
-T) no_target_directory=true;;
|
||||
|
||||
--version) echo "$0 $scriptversion"; exit $?;;
|
||||
|
||||
--) shift
|
||||
break;;
|
||||
|
||||
-*) echo "$0: invalid option: $1" >&2
|
||||
exit 1;;
|
||||
|
||||
*) break;;
|
||||
esac
|
||||
shift
|
||||
done
|
||||
|
||||
if test $# -ne 0 && test -z "$dir_arg$dst_arg"; then
|
||||
# When -d is used, all remaining arguments are directories to create.
|
||||
# When -t is used, the destination is already specified.
|
||||
# Otherwise, the last argument is the destination. Remove it from $@.
|
||||
for arg
|
||||
do
|
||||
if test -n "$dst_arg"; then
|
||||
# $@ is not empty: it contains at least $arg.
|
||||
set fnord "$@" "$dst_arg"
|
||||
shift # fnord
|
||||
fi
|
||||
shift # arg
|
||||
dst_arg=$arg
|
||||
# Protect names problematic for 'test' and other utilities.
|
||||
case $dst_arg in
|
||||
-* | [=\(\)!]) dst_arg=./$dst_arg;;
|
||||
esac
|
||||
done
|
||||
fi
|
||||
|
||||
if test $# -eq 0; then
|
||||
if test -z "$dir_arg"; then
|
||||
echo "$0: no input file specified." >&2
|
||||
exit 1
|
||||
fi
|
||||
# It's OK to call 'install-sh -d' without argument.
|
||||
# This can happen when creating conditional directories.
|
||||
exit 0
|
||||
fi
|
||||
|
||||
if test -z "$dir_arg"; then
|
||||
do_exit='(exit $ret); exit $ret'
|
||||
trap "ret=129; $do_exit" 1
|
||||
trap "ret=130; $do_exit" 2
|
||||
trap "ret=141; $do_exit" 13
|
||||
trap "ret=143; $do_exit" 15
|
||||
|
||||
# Set umask so as not to create temps with too-generous modes.
|
||||
# However, 'strip' requires both read and write access to temps.
|
||||
case $mode in
|
||||
# Optimize common cases.
|
||||
*644) cp_umask=133;;
|
||||
*755) cp_umask=22;;
|
||||
|
||||
*[0-7])
|
||||
if test -z "$stripcmd"; then
|
||||
u_plus_rw=
|
||||
else
|
||||
u_plus_rw='% 200'
|
||||
fi
|
||||
cp_umask=`expr '(' 777 - $mode % 1000 ')' $u_plus_rw`;;
|
||||
*)
|
||||
if test -z "$stripcmd"; then
|
||||
u_plus_rw=
|
||||
else
|
||||
u_plus_rw=,u+rw
|
||||
fi
|
||||
cp_umask=$mode$u_plus_rw;;
|
||||
esac
|
||||
fi
|
||||
|
||||
for src
|
||||
do
|
||||
# Protect names problematic for 'test' and other utilities.
|
||||
case $src in
|
||||
-* | [=\(\)!]) src=./$src;;
|
||||
esac
|
||||
|
||||
if test -n "$dir_arg"; then
|
||||
dst=$src
|
||||
dstdir=$dst
|
||||
test -d "$dstdir"
|
||||
dstdir_status=$?
|
||||
else
|
||||
|
||||
# Waiting for this to be detected by the "$cpprog $src $dsttmp" command
|
||||
# might cause directories to be created, which would be especially bad
|
||||
# if $src (and thus $dsttmp) contains '*'.
|
||||
if test ! -f "$src" && test ! -d "$src"; then
|
||||
echo "$0: $src does not exist." >&2
|
||||
exit 1
|
||||
fi
|
||||
|
||||
if test -z "$dst_arg"; then
|
||||
echo "$0: no destination specified." >&2
|
||||
exit 1
|
||||
fi
|
||||
dst=$dst_arg
|
||||
|
||||
# If destination is a directory, append the input filename; won't work
|
||||
# if double slashes aren't ignored.
|
||||
if test -d "$dst"; then
|
||||
if test -n "$no_target_directory"; then
|
||||
echo "$0: $dst_arg: Is a directory" >&2
|
||||
exit 1
|
||||
fi
|
||||
dstdir=$dst
|
||||
dst=$dstdir/`basename "$src"`
|
||||
dstdir_status=0
|
||||
else
|
||||
# Prefer dirname, but fall back on a substitute if dirname fails.
|
||||
dstdir=`
|
||||
(dirname "$dst") 2>/dev/null ||
|
||||
expr X"$dst" : 'X\(.*[^/]\)//*[^/][^/]*/*$' \| \
|
||||
X"$dst" : 'X\(//\)[^/]' \| \
|
||||
X"$dst" : 'X\(//\)$' \| \
|
||||
X"$dst" : 'X\(/\)' \| . 2>/dev/null ||
|
||||
echo X"$dst" |
|
||||
sed '/^X\(.*[^/]\)\/\/*[^/][^/]*\/*$/{
|
||||
s//\1/
|
||||
q
|
||||
}
|
||||
/^X\(\/\/\)[^/].*/{
|
||||
s//\1/
|
||||
q
|
||||
}
|
||||
/^X\(\/\/\)$/{
|
||||
s//\1/
|
||||
q
|
||||
}
|
||||
/^X\(\/\).*/{
|
||||
s//\1/
|
||||
q
|
||||
}
|
||||
s/.*/./; q'
|
||||
`
|
||||
|
||||
test -d "$dstdir"
|
||||
dstdir_status=$?
|
||||
fi
|
||||
fi
|
||||
|
||||
obsolete_mkdir_used=false
|
||||
|
||||
if test $dstdir_status != 0; then
|
||||
case $posix_mkdir in
|
||||
'')
|
||||
# Create intermediate dirs using mode 755 as modified by the umask.
|
||||
# This is like FreeBSD 'install' as of 1997-10-28.
|
||||
umask=`umask`
|
||||
case $stripcmd.$umask in
|
||||
# Optimize common cases.
|
||||
*[2367][2367]) mkdir_umask=$umask;;
|
||||
.*0[02][02] | .[02][02] | .[02]) mkdir_umask=22;;
|
||||
|
||||
*[0-7])
|
||||
mkdir_umask=`expr $umask + 22 \
|
||||
- $umask % 100 % 40 + $umask % 20 \
|
||||
- $umask % 10 % 4 + $umask % 2
|
||||
`;;
|
||||
*) mkdir_umask=$umask,go-w;;
|
||||
esac
|
||||
|
||||
# With -d, create the new directory with the user-specified mode.
|
||||
# Otherwise, rely on $mkdir_umask.
|
||||
if test -n "$dir_arg"; then
|
||||
mkdir_mode=-m$mode
|
||||
else
|
||||
mkdir_mode=
|
||||
fi
|
||||
|
||||
posix_mkdir=false
|
||||
case $umask in
|
||||
*[123567][0-7][0-7])
|
||||
# POSIX mkdir -p sets u+wx bits regardless of umask, which
|
||||
# is incompatible with FreeBSD 'install' when (umask & 300) != 0.
|
||||
;;
|
||||
*)
|
||||
tmpdir=${TMPDIR-/tmp}/ins$RANDOM-$$
|
||||
trap 'ret=$?; rmdir "$tmpdir/d" "$tmpdir" 2>/dev/null; exit $ret' 0
|
||||
|
||||
if (umask $mkdir_umask &&
|
||||
exec $mkdirprog $mkdir_mode -p -- "$tmpdir/d") >/dev/null 2>&1
|
||||
then
|
||||
if test -z "$dir_arg" || {
|
||||
# Check for POSIX incompatibilities with -m.
|
||||
# HP-UX 11.23 and IRIX 6.5 mkdir -m -p sets group- or
|
||||
# other-writable bit of parent directory when it shouldn't.
|
||||
# FreeBSD 6.1 mkdir -m -p sets mode of existing directory.
|
||||
ls_ld_tmpdir=`ls -ld "$tmpdir"`
|
||||
case $ls_ld_tmpdir in
|
||||
d????-?r-*) different_mode=700;;
|
||||
d????-?--*) different_mode=755;;
|
||||
*) false;;
|
||||
esac &&
|
||||
$mkdirprog -m$different_mode -p -- "$tmpdir" && {
|
||||
ls_ld_tmpdir_1=`ls -ld "$tmpdir"`
|
||||
test "$ls_ld_tmpdir" = "$ls_ld_tmpdir_1"
|
||||
}
|
||||
}
|
||||
then posix_mkdir=:
|
||||
fi
|
||||
rmdir "$tmpdir/d" "$tmpdir"
|
||||
else
|
||||
# Remove any dirs left behind by ancient mkdir implementations.
|
||||
rmdir ./$mkdir_mode ./-p ./-- 2>/dev/null
|
||||
fi
|
||||
trap '' 0;;
|
||||
esac;;
|
||||
esac
|
||||
|
||||
if
|
||||
$posix_mkdir && (
|
||||
umask $mkdir_umask &&
|
||||
$doit_exec $mkdirprog $mkdir_mode -p -- "$dstdir"
|
||||
)
|
||||
then :
|
||||
else
|
||||
|
||||
# The umask is ridiculous, or mkdir does not conform to POSIX,
|
||||
# or it failed possibly due to a race condition. Create the
|
||||
# directory the slow way, step by step, checking for races as we go.
|
||||
|
||||
case $dstdir in
|
||||
/*) prefix='/';;
|
||||
[-=\(\)!]*) prefix='./';;
|
||||
*) prefix='';;
|
||||
esac
|
||||
|
||||
eval "$initialize_posix_glob"
|
||||
|
||||
oIFS=$IFS
|
||||
IFS=/
|
||||
$posix_glob set -f
|
||||
set fnord $dstdir
|
||||
shift
|
||||
$posix_glob set +f
|
||||
IFS=$oIFS
|
||||
|
||||
prefixes=
|
||||
|
||||
for d
|
||||
do
|
||||
test X"$d" = X && continue
|
||||
|
||||
prefix=$prefix$d
|
||||
if test -d "$prefix"; then
|
||||
prefixes=
|
||||
else
|
||||
if $posix_mkdir; then
|
||||
(umask=$mkdir_umask &&
|
||||
$doit_exec $mkdirprog $mkdir_mode -p -- "$dstdir") && break
|
||||
# Don't fail if two instances are running concurrently.
|
||||
test -d "$prefix" || exit 1
|
||||
else
|
||||
case $prefix in
|
||||
*\'*) qprefix=`echo "$prefix" | sed "s/'/'\\\\\\\\''/g"`;;
|
||||
*) qprefix=$prefix;;
|
||||
esac
|
||||
prefixes="$prefixes '$qprefix'"
|
||||
fi
|
||||
fi
|
||||
prefix=$prefix/
|
||||
done
|
||||
|
||||
if test -n "$prefixes"; then
|
||||
# Don't fail if two instances are running concurrently.
|
||||
(umask $mkdir_umask &&
|
||||
eval "\$doit_exec \$mkdirprog $prefixes") ||
|
||||
test -d "$dstdir" || exit 1
|
||||
obsolete_mkdir_used=true
|
||||
fi
|
||||
fi
|
||||
fi
|
||||
|
||||
if test -n "$dir_arg"; then
|
||||
{ test -z "$chowncmd" || $doit $chowncmd "$dst"; } &&
|
||||
{ test -z "$chgrpcmd" || $doit $chgrpcmd "$dst"; } &&
|
||||
{ test "$obsolete_mkdir_used$chowncmd$chgrpcmd" = false ||
|
||||
test -z "$chmodcmd" || $doit $chmodcmd $mode "$dst"; } || exit 1
|
||||
else
|
||||
|
||||
# Make a couple of temp file names in the proper directory.
|
||||
dsttmp=$dstdir/_inst.$$_
|
||||
rmtmp=$dstdir/_rm.$$_
|
||||
|
||||
# Trap to clean up those temp files at exit.
|
||||
trap 'ret=$?; rm -f "$dsttmp" "$rmtmp" && exit $ret' 0
|
||||
|
||||
# Copy the file name to the temp name.
|
||||
(umask $cp_umask && $doit_exec $cpprog "$src" "$dsttmp") &&
|
||||
|
||||
# and set any options; do chmod last to preserve setuid bits.
|
||||
#
|
||||
# If any of these fail, we abort the whole thing. If we want to
|
||||
# ignore errors from any of these, just make sure not to ignore
|
||||
# errors from the above "$doit $cpprog $src $dsttmp" command.
|
||||
#
|
||||
{ test -z "$chowncmd" || $doit $chowncmd "$dsttmp"; } &&
|
||||
{ test -z "$chgrpcmd" || $doit $chgrpcmd "$dsttmp"; } &&
|
||||
{ test -z "$stripcmd" || $doit $stripcmd "$dsttmp"; } &&
|
||||
{ test -z "$chmodcmd" || $doit $chmodcmd $mode "$dsttmp"; } &&
|
||||
|
||||
# If -C, don't bother to copy if it wouldn't change the file.
|
||||
if $copy_on_change &&
|
||||
old=`LC_ALL=C ls -dlL "$dst" 2>/dev/null` &&
|
||||
new=`LC_ALL=C ls -dlL "$dsttmp" 2>/dev/null` &&
|
||||
|
||||
eval "$initialize_posix_glob" &&
|
||||
$posix_glob set -f &&
|
||||
set X $old && old=:$2:$4:$5:$6 &&
|
||||
set X $new && new=:$2:$4:$5:$6 &&
|
||||
$posix_glob set +f &&
|
||||
|
||||
test "$old" = "$new" &&
|
||||
$cmpprog "$dst" "$dsttmp" >/dev/null 2>&1
|
||||
then
|
||||
rm -f "$dsttmp"
|
||||
else
|
||||
# Rename the file to the real destination.
|
||||
$doit $mvcmd -f "$dsttmp" "$dst" 2>/dev/null ||
|
||||
|
||||
# The rename failed, perhaps because mv can't rename something else
|
||||
# to itself, or perhaps because mv is so ancient that it does not
|
||||
# support -f.
|
||||
{
|
||||
# Now remove or move aside any old file at destination location.
|
||||
# We try this two ways since rm can't unlink itself on some
|
||||
# systems and the destination file might be busy for other
|
||||
# reasons. In this case, the final cleanup might fail but the new
|
||||
# file should still install successfully.
|
||||
{
|
||||
test ! -f "$dst" ||
|
||||
$doit $rmcmd -f "$dst" 2>/dev/null ||
|
||||
{ $doit $mvcmd -f "$dst" "$rmtmp" 2>/dev/null &&
|
||||
{ $doit $rmcmd -f "$rmtmp" 2>/dev/null; :; }
|
||||
} ||
|
||||
{ echo "$0: cannot unlink or rename $dst" >&2
|
||||
(exit 1); exit 1
|
||||
}
|
||||
} &&
|
||||
|
||||
# Now rename the file to the real destination.
|
||||
$doit $mvcmd "$dsttmp" "$dst"
|
||||
}
|
||||
fi || exit 1
|
||||
|
||||
trap '' 0
|
||||
fi
|
||||
done
|
||||
|
||||
# Local variables:
|
||||
# eval: (add-hook 'write-file-hooks 'time-stamp)
|
||||
# time-stamp-start: "scriptversion="
|
||||
# time-stamp-format: "%:y-%02m-%02d.%02H"
|
||||
# time-stamp-time-zone: "UTC"
|
||||
# time-stamp-end: "; # UTC"
|
||||
# End:
|
272
m4/ax_ext.m4
|
@ -1,262 +1,74 @@
|
|||
#
|
||||
# Updated by KMG to support -DINTEL_SSE for GF-Complete
|
||||
# This macro is based on http://www.gnu.org/software/autoconf-archive/ax_ext.html
|
||||
# but simplified to do compile time SIMD checks only
|
||||
#
|
||||
# ===========================================================================
|
||||
# http://www.gnu.org/software/autoconf-archive/ax_ext.html
|
||||
# ===========================================================================
|
||||
#
|
||||
# SYNOPSIS
|
||||
#
|
||||
# AX_EXT
|
||||
#
|
||||
# DESCRIPTION
|
||||
#
|
||||
# Find supported SIMD extensions by requesting cpuid. When an SIMD
|
||||
# extension is found, the -m"simdextensionname" is added to SIMD_FLAGS if
|
||||
# compiler supports it. For example, if "sse2" is available, then "-msse2"
|
||||
# is added to SIMD_FLAGS.
|
||||
#
|
||||
# This macro calls:
|
||||
#
|
||||
# AC_SUBST(SIMD_FLAGS)
|
||||
#
|
||||
# And defines:
|
||||
#
|
||||
# HAVE_MMX / HAVE_SSE / HAVE_SSE2 / HAVE_SSE3 / HAVE_SSSE3 / HAVE_SSE4.1 / HAVE_SSE4.2 / HAVE_AVX
|
||||
#
|
||||
# LICENSE
|
||||
#
|
||||
# Copyright (c) 2007 Christophe Tournayre <turn3r@users.sourceforge.net>
|
||||
# Copyright (c) 2013 Michael Petch <mpetch@capp-sysware.com>
|
||||
#
|
||||
# Copying and distribution of this file, with or without modification, are
|
||||
# permitted in any medium without royalty provided the copyright notice
|
||||
# and this notice are preserved. This file is offered as-is, without any
|
||||
# warranty.
|
||||
|
||||
#serial 12
|
||||
|
||||
AC_DEFUN([AX_EXT],
|
||||
[
|
||||
AC_REQUIRE([AC_CANONICAL_HOST])
|
||||
|
||||
case $host_cpu in
|
||||
aarch64*)
|
||||
AC_DEFINE(HAVE_ARCH_AARCH64,,[targeting AArch64])
|
||||
SIMD_FLAGS="$SIMD_FLAGS -DARCH_AARCH64"
|
||||
|
||||
AC_CACHE_CHECK([whether NEON is enabled], [ax_cv_have_neon_ext], [ax_cv_have_neon_ext=yes])
|
||||
if test "$ax_cv_have_neon_ext" = yes; then
|
||||
AX_CHECK_COMPILE_FLAG(-march=armv8-a+simd, [SIMD_FLAGS="$SIMD_FLAGS -march=armv8-a+simd -DARM_NEON"], [ax_cv_have_neon_ext=no])
|
||||
fi
|
||||
;;
|
||||
|
||||
arm*)
|
||||
AC_CACHE_CHECK([whether NEON is enabled], [ax_cv_have_neon_ext], [ax_cv_have_neon_ext=yes])
|
||||
if test "$ax_cv_have_neon_ext" = yes; then
|
||||
AX_CHECK_COMPILE_FLAG(-mfpu=neon, [SIMD_FLAGS="$SIMD_FLAGS -mfpu=neon -DARM_NEON"], [ax_cv_have_neon_ext=no])
|
||||
fi
|
||||
;;
|
||||
|
||||
powerpc*)
|
||||
AC_CACHE_CHECK([whether altivec is supported], [ax_cv_have_altivec_ext],
|
||||
[
|
||||
if test `/usr/sbin/sysctl -a 2>/dev/null| grep -c hw.optional.altivec` != 0; then
|
||||
if test `/usr/sbin/sysctl -n hw.optional.altivec` = 1; then
|
||||
ax_cv_have_altivec_ext=yes
|
||||
fi
|
||||
fi
|
||||
])
|
||||
|
||||
if test "$ax_cv_have_altivec_ext" = yes; then
|
||||
AC_DEFINE(HAVE_ALTIVEC,,[Support Altivec instructions])
|
||||
AX_CHECK_COMPILE_FLAG(-faltivec, SIMD_FLAGS="$SIMD_FLAGS -faltivec", [])
|
||||
fi
|
||||
;;
|
||||
|
||||
AC_CACHE_CHECK([whether altivec is enabled], [ax_cv_have_altivec_ext], [ax_cv_have_altivec_ext=yes])
|
||||
if test "$ax_cv_have_altivec_ext" = yes; then
|
||||
AX_CHECK_COMPILE_FLAG(-faltivec, [SIMD_FLAGS="$SIMD_FLAGS -faltivec"], [ax_cv_have_altivec_ext=no])
|
||||
fi
|
||||
;;
|
||||
|
||||
i[[3456]]86*|x86_64*|amd64*)
|
||||
|
||||
AC_REQUIRE([AX_GCC_X86_CPUID])
|
||||
AC_REQUIRE([AX_GCC_X86_AVX_XGETBV])
|
||||
|
||||
AX_GCC_X86_CPUID(0x00000001)
|
||||
ecx=`echo $ax_cv_gcc_x86_cpuid_0x00000001 | cut -d ":" -f 3`
|
||||
edx=`echo $ax_cv_gcc_x86_cpuid_0x00000001 | cut -d ":" -f 4`
|
||||
|
||||
AC_CACHE_CHECK([whether mmx is supported], [ax_cv_have_mmx_ext],
|
||||
[
|
||||
ax_cv_have_mmx_ext=no
|
||||
if test "$((0x$edx>>23&0x01))" = 1; then
|
||||
ax_cv_have_mmx_ext=yes
|
||||
fi
|
||||
])
|
||||
|
||||
AC_CACHE_CHECK([whether sse is supported], [ax_cv_have_sse_ext],
|
||||
[
|
||||
ax_cv_have_sse_ext=no
|
||||
if test "$((0x$edx>>25&0x01))" = 1; then
|
||||
ax_cv_have_sse_ext=yes
|
||||
fi
|
||||
])
|
||||
|
||||
AC_CACHE_CHECK([whether sse2 is supported], [ax_cv_have_sse2_ext],
|
||||
[
|
||||
ax_cv_have_sse2_ext=no
|
||||
if test "$((0x$edx>>26&0x01))" = 1; then
|
||||
ax_cv_have_sse2_ext=yes
|
||||
fi
|
||||
])
|
||||
|
||||
AC_CACHE_CHECK([whether sse3 is supported], [ax_cv_have_sse3_ext],
|
||||
[
|
||||
ax_cv_have_sse3_ext=no
|
||||
if test "$((0x$ecx&0x01))" = 1; then
|
||||
ax_cv_have_sse3_ext=yes
|
||||
fi
|
||||
])
|
||||
|
||||
AC_CACHE_CHECK([whether pclmuldq is supported], [ax_cv_have_pclmuldq_ext],
|
||||
[
|
||||
ax_cv_have_pclmuldq_ext=no
|
||||
if test "$((0x$ecx>>1&0x01))" = 1; then
|
||||
ax_cv_have_pclmuldq_ext=yes
|
||||
fi
|
||||
])
|
||||
|
||||
AC_CACHE_CHECK([whether ssse3 is supported], [ax_cv_have_ssse3_ext],
|
||||
[
|
||||
ax_cv_have_ssse3_ext=no
|
||||
if test "$((0x$ecx>>9&0x01))" = 1; then
|
||||
ax_cv_have_ssse3_ext=yes
|
||||
fi
|
||||
])
|
||||
|
||||
AC_CACHE_CHECK([whether sse4.1 is supported], [ax_cv_have_sse41_ext],
|
||||
[
|
||||
ax_cv_have_sse41_ext=no
|
||||
if test "$((0x$ecx>>19&0x01))" = 1; then
|
||||
ax_cv_have_sse41_ext=yes
|
||||
fi
|
||||
])
|
||||
|
||||
AC_CACHE_CHECK([whether sse4.2 is supported], [ax_cv_have_sse42_ext],
|
||||
[
|
||||
ax_cv_have_sse42_ext=no
|
||||
if test "$((0x$ecx>>20&0x01))" = 1; then
|
||||
ax_cv_have_sse42_ext=yes
|
||||
fi
|
||||
])
|
||||
|
||||
AC_CACHE_CHECK([whether avx is supported by processor], [ax_cv_have_avx_cpu_ext],
|
||||
[
|
||||
ax_cv_have_avx_cpu_ext=no
|
||||
if test "$((0x$ecx>>28&0x01))" = 1; then
|
||||
ax_cv_have_avx_cpu_ext=yes
|
||||
fi
|
||||
])
|
||||
|
||||
if test x"$ax_cv_have_avx_cpu_ext" = x"yes"; then
|
||||
AX_GCC_X86_AVX_XGETBV(0x00000000)
|
||||
|
||||
xgetbv_eax="0"
|
||||
if test x"$ax_cv_gcc_x86_avx_xgetbv_0x00000000" != x"unknown"; then
|
||||
xgetbv_eax=`echo $ax_cv_gcc_x86_avx_xgetbv_0x00000000 | cut -d ":" -f 1`
|
||||
fi
|
||||
|
||||
AC_CACHE_CHECK([whether avx is supported by operating system], [ax_cv_have_avx_ext],
|
||||
[
|
||||
ax_cv_have_avx_ext=no
|
||||
|
||||
if test "$((0x$ecx>>27&0x01))" = 1; then
|
||||
if test "$((0x$xgetbv_eax&0x6))" = 6; then
|
||||
ax_cv_have_avx_ext=yes
|
||||
fi
|
||||
fi
|
||||
])
|
||||
if test x"$ax_cv_have_avx_ext" = x"no"; then
|
||||
AC_MSG_WARN([Your processor supports AVX, but your operating system doesn't])
|
||||
fi
|
||||
fi
|
||||
|
||||
if test "$ax_cv_have_mmx_ext" = yes; then
|
||||
AX_CHECK_COMPILE_FLAG(-mmmx, ax_cv_support_mmx_ext=yes, [])
|
||||
if test x"$ax_cv_support_mmx_ext" = x"yes"; then
|
||||
SIMD_FLAGS="$SIMD_FLAGS -mmmx"
|
||||
AC_DEFINE(HAVE_MMX,,[Support mmx instructions])
|
||||
else
|
||||
AC_MSG_WARN([Your processor supports mmx instructions but not your compiler, can you try another compiler?])
|
||||
fi
|
||||
fi
|
||||
|
||||
if test "$ac_cv_sizeof_long" -eq 8; then
|
||||
SIMD_FLAGS="$SIMD_FLAGS -DARCH_64"
|
||||
fi
|
||||
|
||||
AC_CACHE_CHECK([whether sse is enabled], [ax_cv_have_sse_ext], [ax_cv_have_sse_ext=yes])
|
||||
if test "$ax_cv_have_sse_ext" = yes; then
|
||||
AX_CHECK_COMPILE_FLAG(-msse, ax_cv_support_sse_ext=yes, [])
|
||||
if test x"$ax_cv_support_sse_ext" = x"yes"; then
|
||||
SIMD_FLAGS="$SIMD_FLAGS -msse -DINTEL_SSE"
|
||||
AC_DEFINE(HAVE_SSE,,[Support SSE (Streaming SIMD Extensions) instructions])
|
||||
else
|
||||
AC_MSG_WARN([Your processor supports sse instructions but not your compiler, can you try another compiler?])
|
||||
fi
|
||||
AX_CHECK_COMPILE_FLAG(-msse, [SIMD_FLAGS="$SIMD_FLAGS -msse -DINTEL_SSE"], [ax_cv_have_sse_ext=no])
|
||||
fi
|
||||
|
||||
AC_CACHE_CHECK([whether sse2 is enabled], [ax_cv_have_sse2_ext], [ax_cv_have_sse2_ext=yes])
|
||||
if test "$ax_cv_have_sse2_ext" = yes; then
|
||||
AX_CHECK_COMPILE_FLAG(-msse2, ax_cv_support_sse2_ext=yes, [])
|
||||
if test x"$ax_cv_support_sse2_ext" = x"yes"; then
|
||||
SIMD_FLAGS="$SIMD_FLAGS -msse2 -DINTEL_SSE2"
|
||||
AC_DEFINE(HAVE_SSE2,,[Support SSE2 (Streaming SIMD Extensions 2) instructions])
|
||||
else
|
||||
AC_MSG_WARN([Your processor supports sse2 instructions but not your compiler, can you try another compiler?])
|
||||
fi
|
||||
AX_CHECK_COMPILE_FLAG(-msse2, [SIMD_FLAGS="$SIMD_FLAGS -msse2 -DINTEL_SSE2"], [ax_cv_have_sse2_ext=no])
|
||||
fi
|
||||
|
||||
AC_CACHE_CHECK([whether sse3 is enabled], [ax_cv_have_sse3_ext], [ax_cv_have_sse3_ext=yes])
|
||||
if test "$ax_cv_have_sse3_ext" = yes; then
|
||||
AX_CHECK_COMPILE_FLAG(-msse3, ax_cv_support_sse3_ext=yes, [])
|
||||
if test x"$ax_cv_support_sse3_ext" = x"yes"; then
|
||||
SIMD_FLAGS="$SIMD_FLAGS -msse3 -DINTEL_SSE3"
|
||||
AC_DEFINE(HAVE_SSE3,,[Support SSE3 (Streaming SIMD Extensions 3) instructions])
|
||||
else
|
||||
AC_MSG_WARN([Your processor supports sse3 instructions but not your compiler, can you try another compiler?])
|
||||
fi
|
||||
fi
|
||||
|
||||
if test "$ax_cv_have_pclmuldq_ext" = yes; then
|
||||
AX_CHECK_COMPILE_FLAG(-mpclmul, ax_cv_support_pclmuldq_ext=yes, [])
|
||||
if test x"$ax_cv_support_pclmuldq_ext" = x"yes"; then
|
||||
SIMD_FLAGS="$SIMD_FLAGS -mpclmul -DINTEL_SSE4_PCLMUL"
|
||||
AC_DEFINE(HAVE_PCLMULDQ,,[Support (PCLMULDQ) Carry-Free Muliplication])
|
||||
else
|
||||
AC_MSG_WARN([Your processor supports pclmuldq instructions but not your compiler, can you try another compiler?])
|
||||
fi
|
||||
AX_CHECK_COMPILE_FLAG(-msse3, [SIMD_FLAGS="$SIMD_FLAGS -msse3 -DINTEL_SSE3"], [ax_cv_have_sse3_ext=no])
|
||||
fi
|
||||
|
||||
AC_CACHE_CHECK([whether ssse3 is enabled], [ax_cv_have_ssse3_ext], [ax_cv_have_ssse3_ext=yes])
|
||||
if test "$ax_cv_have_ssse3_ext" = yes; then
|
||||
AX_CHECK_COMPILE_FLAG(-mssse3, ax_cv_support_ssse3_ext=yes, [])
|
||||
if test x"$ax_cv_support_ssse3_ext" = x"yes"; then
|
||||
SIMD_FLAGS="$SIMD_FLAGS -mssse3 -DINTEL_SSSE3"
|
||||
AC_DEFINE(HAVE_SSSE3,,[Support SSSE3 (Supplemental Streaming SIMD Extensions 3) instructions])
|
||||
else
|
||||
AC_MSG_WARN([Your processor supports ssse3 instructions but not your compiler, can you try another compiler?])
|
||||
fi
|
||||
AX_CHECK_COMPILE_FLAG(-mssse3, [SIMD_FLAGS="$SIMD_FLAGS -mssse3 -DINTEL_SSSE3"], [ax_cv_have_ssse3_ext=no])
|
||||
fi
|
||||
|
||||
AC_CACHE_CHECK([whether pclmuldq is enabled], [ax_cv_have_pclmuldq_ext], [ax_cv_have_pclmuldq_ext=yes])
|
||||
if test "$ax_cv_have_pclmuldq_ext" = yes; then
|
||||
AX_CHECK_COMPILE_FLAG(-mpclmul, [SIMD_FLAGS="$SIMD_FLAGS -mpclmul -DINTEL_SSE4_PCLMUL"], [ax_cv_have_pclmuldq_ext=no])
|
||||
fi
|
||||
|
||||
AC_CACHE_CHECK([whether sse4.1 is enabled], [ax_cv_have_sse41_ext], [ax_cv_have_sse41_ext=yes])
|
||||
if test "$ax_cv_have_sse41_ext" = yes; then
|
||||
AX_CHECK_COMPILE_FLAG(-msse4.1, ax_cv_support_sse41_ext=yes, [])
|
||||
if test x"$ax_cv_support_sse41_ext" = x"yes"; then
|
||||
SIMD_FLAGS="$SIMD_FLAGS -msse4.1 -DINTEL_SSE4"
|
||||
AC_DEFINE(HAVE_SSE4_1,,[Support SSSE4.1 (Streaming SIMD Extensions 4.1) instructions])
|
||||
else
|
||||
AC_MSG_WARN([Your processor supports sse4.1 instructions but not your compiler, can you try another compiler?])
|
||||
fi
|
||||
AX_CHECK_COMPILE_FLAG(-msse4.1, [SIMD_FLAGS="$SIMD_FLAGS -msse4.1 -DINTEL_SSE4"], [ax_cv_have_sse41_ext=no])
|
||||
fi
|
||||
|
||||
AC_CACHE_CHECK([whether sse4.2 is enabled], [ax_cv_have_sse42_ext], [ax_cv_have_sse42_ext=yes])
|
||||
if test "$ax_cv_have_sse42_ext" = yes; then
|
||||
AX_CHECK_COMPILE_FLAG(-msse4.2, ax_cv_support_sse42_ext=yes, [])
|
||||
if test x"$ax_cv_support_sse42_ext" = x"yes"; then
|
||||
SIMD_FLAGS="$SIMD_FLAGS -msse4.2 -DINTEL_SSE4"
|
||||
AC_DEFINE(HAVE_SSE4_2,,[Support SSSE4.2 (Streaming SIMD Extensions 4.2) instructions])
|
||||
else
|
||||
AC_MSG_WARN([Your processor supports sse4.2 instructions but not your compiler, can you try another compiler?])
|
||||
fi
|
||||
AX_CHECK_COMPILE_FLAG(-msse4.2, [SIMD_FLAGS="$SIMD_FLAGS -msse4.2 -DINTEL_SSE4"], [ax_cv_have_sse42_ext=no])
|
||||
fi
|
||||
|
||||
if test "$ax_cv_have_avx_ext" = yes; then
|
||||
AX_CHECK_COMPILE_FLAG(-mavx, ax_cv_support_avx_ext=yes, [])
|
||||
if test x"$ax_cv_support_avx_ext" = x"yes"; then
|
||||
SIMD_FLAGS="$SIMD_FLAGS -mavx"
|
||||
AC_DEFINE(HAVE_AVX,,[Support AVX (Advanced Vector Extensions) instructions])
|
||||
else
|
||||
AC_MSG_WARN([Your processor supports avx instructions but not your compiler, can you try another compiler?])
|
||||
fi
|
||||
fi
|
||||
|
||||
;;
|
||||
;;
|
||||
esac
|
||||
|
||||
AC_SUBST(SIMD_FLAGS)
|
||||
|
|
|
@ -1,79 +0,0 @@
|
|||
# ===========================================================================
|
||||
# http://www.gnu.org/software/autoconf-archive/ax_gcc_x86_avx_xgetbv.html
|
||||
# ===========================================================================
|
||||
#
|
||||
# SYNOPSIS
|
||||
#
|
||||
# AX_GCC_X86_AVX_XGETBV
|
||||
#
|
||||
# DESCRIPTION
|
||||
#
|
||||
# On later x86 processors with AVX SIMD support, with gcc or a compiler
|
||||
# that has a compatible syntax for inline assembly instructions, run a
|
||||
# small program that executes the xgetbv instruction with input OP. This
|
||||
# can be used to detect if the OS supports AVX instruction usage.
|
||||
#
|
||||
# On output, the values of the eax and edx registers are stored as
|
||||
# hexadecimal strings as "eax:edx" in the cache variable
|
||||
# ax_cv_gcc_x86_avx_xgetbv.
|
||||
#
|
||||
# If the xgetbv instruction fails (because you are running a
|
||||
# cross-compiler, or because you are not using gcc, or because you are on
|
||||
# a processor that doesn't have this instruction),
|
||||
# ax_cv_gcc_x86_avx_xgetbv_OP is set to the string "unknown".
|
||||
#
|
||||
# This macro mainly exists to be used in AX_EXT.
|
||||
#
|
||||
# LICENSE
|
||||
#
|
||||
# Copyright (c) 2013 Michael Petch <mpetch@capp-sysware.com>
|
||||
#
|
||||
# This program is free software: you can redistribute it and/or modify it
|
||||
# under the terms of the GNU General Public License as published by the
|
||||
# Free Software Foundation, either version 3 of the License, or (at your
|
||||
# option) any later version.
|
||||
#
|
||||
# This program is distributed in the hope that it will be useful, but
|
||||
# WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General
|
||||
# Public License for more details.
|
||||
#
|
||||
# You should have received a copy of the GNU General Public License along
|
||||
# with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||
#
|
||||
# As a special exception, the respective Autoconf Macro's copyright owner
|
||||
# gives unlimited permission to copy, distribute and modify the configure
|
||||
# scripts that are the output of Autoconf when processing the Macro. You
|
||||
# need not follow the terms of the GNU General Public License when using
|
||||
# or distributing such scripts, even though portions of the text of the
|
||||
# Macro appear in them. The GNU General Public License (GPL) does govern
|
||||
# all other use of the material that constitutes the Autoconf Macro.
|
||||
#
|
||||
# This special exception to the GPL applies to versions of the Autoconf
|
||||
# Macro released by the Autoconf Archive. When you make and distribute a
|
||||
# modified version of the Autoconf Macro, you may extend this special
|
||||
# exception to the GPL to apply to your modified version as well.
|
||||
|
||||
#serial 1
|
||||
|
||||
AC_DEFUN([AX_GCC_X86_AVX_XGETBV],
|
||||
[AC_REQUIRE([AC_PROG_CC])
|
||||
AC_LANG_PUSH([C])
|
||||
AC_CACHE_CHECK(for x86-AVX xgetbv $1 output, ax_cv_gcc_x86_avx_xgetbv_$1,
|
||||
[AC_RUN_IFELSE([AC_LANG_PROGRAM([#include <stdio.h>], [
|
||||
int op = $1, eax, edx;
|
||||
FILE *f;
|
||||
/* Opcodes for xgetbv */
|
||||
__asm__(".byte 0x0f, 0x01, 0xd0"
|
||||
: "=a" (eax), "=d" (edx)
|
||||
: "c" (op));
|
||||
f = fopen("conftest_xgetbv", "w"); if (!f) return 1;
|
||||
fprintf(f, "%x:%x\n", eax, edx);
|
||||
fclose(f);
|
||||
return 0;
|
||||
])],
|
||||
[ax_cv_gcc_x86_avx_xgetbv_$1=`cat conftest_xgetbv`; rm -f conftest_xgetbv],
|
||||
[ax_cv_gcc_x86_avx_xgetbv_$1=unknown; rm -f conftest_xgetbv],
|
||||
[ax_cv_gcc_x86_avx_xgetbv_$1=unknown])])
|
||||
AC_LANG_POP([C])
|
||||
])
|
|
@ -1,79 +0,0 @@
|
|||
# ===========================================================================
|
||||
# http://www.gnu.org/software/autoconf-archive/ax_gcc_x86_cpuid.html
|
||||
# ===========================================================================
|
||||
#
|
||||
# SYNOPSIS
|
||||
#
|
||||
# AX_GCC_X86_CPUID(OP)
|
||||
#
|
||||
# DESCRIPTION
|
||||
#
|
||||
# On Pentium and later x86 processors, with gcc or a compiler that has a
|
||||
# compatible syntax for inline assembly instructions, run a small program
|
||||
# that executes the cpuid instruction with input OP. This can be used to
|
||||
# detect the CPU type.
|
||||
#
|
||||
# On output, the values of the eax, ebx, ecx, and edx registers are stored
|
||||
# as hexadecimal strings as "eax:ebx:ecx:edx" in the cache variable
|
||||
# ax_cv_gcc_x86_cpuid_OP.
|
||||
#
|
||||
# If the cpuid instruction fails (because you are running a
|
||||
# cross-compiler, or because you are not using gcc, or because you are on
|
||||
# a processor that doesn't have this instruction), ax_cv_gcc_x86_cpuid_OP
|
||||
# is set to the string "unknown".
|
||||
#
|
||||
# This macro mainly exists to be used in AX_GCC_ARCHFLAG.
|
||||
#
|
||||
# LICENSE
|
||||
#
|
||||
# Copyright (c) 2008 Steven G. Johnson <stevenj@alum.mit.edu>
|
||||
# Copyright (c) 2008 Matteo Frigo
|
||||
#
|
||||
# This program is free software: you can redistribute it and/or modify it
|
||||
# under the terms of the GNU General Public License as published by the
|
||||
# Free Software Foundation, either version 3 of the License, or (at your
|
||||
# option) any later version.
|
||||
#
|
||||
# This program is distributed in the hope that it will be useful, but
|
||||
# WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General
|
||||
# Public License for more details.
|
||||
#
|
||||
# You should have received a copy of the GNU General Public License along
|
||||
# with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||
#
|
||||
# As a special exception, the respective Autoconf Macro's copyright owner
|
||||
# gives unlimited permission to copy, distribute and modify the configure
|
||||
# scripts that are the output of Autoconf when processing the Macro. You
|
||||
# need not follow the terms of the GNU General Public License when using
|
||||
# or distributing such scripts, even though portions of the text of the
|
||||
# Macro appear in them. The GNU General Public License (GPL) does govern
|
||||
# all other use of the material that constitutes the Autoconf Macro.
|
||||
#
|
||||
# This special exception to the GPL applies to versions of the Autoconf
|
||||
# Macro released by the Autoconf Archive. When you make and distribute a
|
||||
# modified version of the Autoconf Macro, you may extend this special
|
||||
# exception to the GPL to apply to your modified version as well.
|
||||
|
||||
#serial 7
|
||||
|
||||
AC_DEFUN([AX_GCC_X86_CPUID],
|
||||
[AC_REQUIRE([AC_PROG_CC])
|
||||
AC_LANG_PUSH([C])
|
||||
AC_CACHE_CHECK(for x86 cpuid $1 output, ax_cv_gcc_x86_cpuid_$1,
|
||||
[AC_RUN_IFELSE([AC_LANG_PROGRAM([#include <stdio.h>], [
|
||||
int op = $1, eax, ebx, ecx, edx;
|
||||
FILE *f;
|
||||
__asm__("cpuid"
|
||||
: "=a" (eax), "=b" (ebx), "=c" (ecx), "=d" (edx)
|
||||
: "a" (op));
|
||||
f = fopen("conftest_cpuid", "w"); if (!f) return 1;
|
||||
fprintf(f, "%x:%x:%x:%x\n", eax, ebx, ecx, edx);
|
||||
fclose(f);
|
||||
return 0;
|
||||
])],
|
||||
[ax_cv_gcc_x86_cpuid_$1=`cat conftest_cpuid`; rm -f conftest_cpuid],
|
||||
[ax_cv_gcc_x86_cpuid_$1=unknown; rm -f conftest_cpuid],
|
||||
[ax_cv_gcc_x86_cpuid_$1=unknown])])
|
||||
AC_LANG_POP([C])
|
||||
])
|
|
@ -1,384 +0,0 @@
|
|||
# Helper functions for option handling. -*- Autoconf -*-
|
||||
#
|
||||
# Copyright (C) 2004, 2005, 2007, 2008, 2009 Free Software Foundation,
|
||||
# Inc.
|
||||
# Written by Gary V. Vaughan, 2004
|
||||
#
|
||||
# This file is free software; the Free Software Foundation gives
|
||||
# unlimited permission to copy and/or distribute it, with or without
|
||||
# modifications, as long as this notice is preserved.
|
||||
|
||||
# serial 7 ltoptions.m4
|
||||
|
||||
# This is to help aclocal find these macros, as it can't see m4_define.
|
||||
AC_DEFUN([LTOPTIONS_VERSION], [m4_if([1])])
|
||||
|
||||
|
||||
# _LT_MANGLE_OPTION(MACRO-NAME, OPTION-NAME)
|
||||
# ------------------------------------------
|
||||
m4_define([_LT_MANGLE_OPTION],
|
||||
[[_LT_OPTION_]m4_bpatsubst($1__$2, [[^a-zA-Z0-9_]], [_])])
|
||||
|
||||
|
||||
# _LT_SET_OPTION(MACRO-NAME, OPTION-NAME)
|
||||
# ---------------------------------------
|
||||
# Set option OPTION-NAME for macro MACRO-NAME, and if there is a
|
||||
# matching handler defined, dispatch to it. Other OPTION-NAMEs are
|
||||
# saved as a flag.
|
||||
m4_define([_LT_SET_OPTION],
|
||||
[m4_define(_LT_MANGLE_OPTION([$1], [$2]))dnl
|
||||
m4_ifdef(_LT_MANGLE_DEFUN([$1], [$2]),
|
||||
_LT_MANGLE_DEFUN([$1], [$2]),
|
||||
[m4_warning([Unknown $1 option `$2'])])[]dnl
|
||||
])
|
||||
|
||||
|
||||
# _LT_IF_OPTION(MACRO-NAME, OPTION-NAME, IF-SET, [IF-NOT-SET])
|
||||
# ------------------------------------------------------------
|
||||
# Execute IF-SET if OPTION is set, IF-NOT-SET otherwise.
|
||||
m4_define([_LT_IF_OPTION],
|
||||
[m4_ifdef(_LT_MANGLE_OPTION([$1], [$2]), [$3], [$4])])
|
||||
|
||||
|
||||
# _LT_UNLESS_OPTIONS(MACRO-NAME, OPTION-LIST, IF-NOT-SET)
|
||||
# -------------------------------------------------------
|
||||
# Execute IF-NOT-SET unless all options in OPTION-LIST for MACRO-NAME
|
||||
# are set.
|
||||
m4_define([_LT_UNLESS_OPTIONS],
|
||||
[m4_foreach([_LT_Option], m4_split(m4_normalize([$2])),
|
||||
[m4_ifdef(_LT_MANGLE_OPTION([$1], _LT_Option),
|
||||
[m4_define([$0_found])])])[]dnl
|
||||
m4_ifdef([$0_found], [m4_undefine([$0_found])], [$3
|
||||
])[]dnl
|
||||
])
|
||||
|
||||
|
||||
# _LT_SET_OPTIONS(MACRO-NAME, OPTION-LIST)
|
||||
# ----------------------------------------
|
||||
# OPTION-LIST is a space-separated list of Libtool options associated
|
||||
# with MACRO-NAME. If any OPTION has a matching handler declared with
|
||||
# LT_OPTION_DEFINE, dispatch to that macro; otherwise complain about
|
||||
# the unknown option and exit.
|
||||
m4_defun([_LT_SET_OPTIONS],
|
||||
[# Set options
|
||||
m4_foreach([_LT_Option], m4_split(m4_normalize([$2])),
|
||||
[_LT_SET_OPTION([$1], _LT_Option)])
|
||||
|
||||
m4_if([$1],[LT_INIT],[
|
||||
dnl
|
||||
dnl Simply set some default values (i.e off) if boolean options were not
|
||||
dnl specified:
|
||||
_LT_UNLESS_OPTIONS([LT_INIT], [dlopen], [enable_dlopen=no
|
||||
])
|
||||
_LT_UNLESS_OPTIONS([LT_INIT], [win32-dll], [enable_win32_dll=no
|
||||
])
|
||||
dnl
|
||||
dnl If no reference was made to various pairs of opposing options, then
|
||||
dnl we run the default mode handler for the pair. For example, if neither
|
||||
dnl `shared' nor `disable-shared' was passed, we enable building of shared
|
||||
dnl archives by default:
|
||||
_LT_UNLESS_OPTIONS([LT_INIT], [shared disable-shared], [_LT_ENABLE_SHARED])
|
||||
_LT_UNLESS_OPTIONS([LT_INIT], [static disable-static], [_LT_ENABLE_STATIC])
|
||||
_LT_UNLESS_OPTIONS([LT_INIT], [pic-only no-pic], [_LT_WITH_PIC])
|
||||
_LT_UNLESS_OPTIONS([LT_INIT], [fast-install disable-fast-install],
|
||||
[_LT_ENABLE_FAST_INSTALL])
|
||||
])
|
||||
])# _LT_SET_OPTIONS
|
||||
|
||||
|
||||
## --------------------------------- ##
|
||||
## Macros to handle LT_INIT options. ##
|
||||
## --------------------------------- ##
|
||||
|
||||
# _LT_MANGLE_DEFUN(MACRO-NAME, OPTION-NAME)
|
||||
# -----------------------------------------
|
||||
m4_define([_LT_MANGLE_DEFUN],
|
||||
[[_LT_OPTION_DEFUN_]m4_bpatsubst(m4_toupper([$1__$2]), [[^A-Z0-9_]], [_])])
|
||||
|
||||
|
||||
# LT_OPTION_DEFINE(MACRO-NAME, OPTION-NAME, CODE)
|
||||
# -----------------------------------------------
|
||||
m4_define([LT_OPTION_DEFINE],
|
||||
[m4_define(_LT_MANGLE_DEFUN([$1], [$2]), [$3])[]dnl
|
||||
])# LT_OPTION_DEFINE
|
||||
|
||||
|
||||
# dlopen
|
||||
# ------
|
||||
LT_OPTION_DEFINE([LT_INIT], [dlopen], [enable_dlopen=yes
|
||||
])
|
||||
|
||||
AU_DEFUN([AC_LIBTOOL_DLOPEN],
|
||||
[_LT_SET_OPTION([LT_INIT], [dlopen])
|
||||
AC_DIAGNOSE([obsolete],
|
||||
[$0: Remove this warning and the call to _LT_SET_OPTION when you
|
||||
put the `dlopen' option into LT_INIT's first parameter.])
|
||||
])
|
||||
|
||||
dnl aclocal-1.4 backwards compatibility:
|
||||
dnl AC_DEFUN([AC_LIBTOOL_DLOPEN], [])
|
||||
|
||||
|
||||
# win32-dll
|
||||
# ---------
|
||||
# Declare package support for building win32 dll's.
|
||||
LT_OPTION_DEFINE([LT_INIT], [win32-dll],
|
||||
[enable_win32_dll=yes
|
||||
|
||||
case $host in
|
||||
*-*-cygwin* | *-*-mingw* | *-*-pw32* | *-*-cegcc*)
|
||||
AC_CHECK_TOOL(AS, as, false)
|
||||
AC_CHECK_TOOL(DLLTOOL, dlltool, false)
|
||||
AC_CHECK_TOOL(OBJDUMP, objdump, false)
|
||||
;;
|
||||
esac
|
||||
|
||||
test -z "$AS" && AS=as
|
||||
_LT_DECL([], [AS], [1], [Assembler program])dnl
|
||||
|
||||
test -z "$DLLTOOL" && DLLTOOL=dlltool
|
||||
_LT_DECL([], [DLLTOOL], [1], [DLL creation program])dnl
|
||||
|
||||
test -z "$OBJDUMP" && OBJDUMP=objdump
|
||||
_LT_DECL([], [OBJDUMP], [1], [Object dumper program])dnl
|
||||
])# win32-dll
|
||||
|
||||
AU_DEFUN([AC_LIBTOOL_WIN32_DLL],
|
||||
[AC_REQUIRE([AC_CANONICAL_HOST])dnl
|
||||
_LT_SET_OPTION([LT_INIT], [win32-dll])
|
||||
AC_DIAGNOSE([obsolete],
|
||||
[$0: Remove this warning and the call to _LT_SET_OPTION when you
|
||||
put the `win32-dll' option into LT_INIT's first parameter.])
|
||||
])
|
||||
|
||||
dnl aclocal-1.4 backwards compatibility:
|
||||
dnl AC_DEFUN([AC_LIBTOOL_WIN32_DLL], [])
|
||||
|
||||
|
||||
# _LT_ENABLE_SHARED([DEFAULT])
|
||||
# ----------------------------
|
||||
# implement the --enable-shared flag, and supports the `shared' and
|
||||
# `disable-shared' LT_INIT options.
|
||||
# DEFAULT is either `yes' or `no'. If omitted, it defaults to `yes'.
|
||||
m4_define([_LT_ENABLE_SHARED],
|
||||
[m4_define([_LT_ENABLE_SHARED_DEFAULT], [m4_if($1, no, no, yes)])dnl
|
||||
AC_ARG_ENABLE([shared],
|
||||
[AS_HELP_STRING([--enable-shared@<:@=PKGS@:>@],
|
||||
[build shared libraries @<:@default=]_LT_ENABLE_SHARED_DEFAULT[@:>@])],
|
||||
[p=${PACKAGE-default}
|
||||
case $enableval in
|
||||
yes) enable_shared=yes ;;
|
||||
no) enable_shared=no ;;
|
||||
*)
|
||||
enable_shared=no
|
||||
# Look at the argument we got. We use all the common list separators.
|
||||
lt_save_ifs="$IFS"; IFS="${IFS}$PATH_SEPARATOR,"
|
||||
for pkg in $enableval; do
|
||||
IFS="$lt_save_ifs"
|
||||
if test "X$pkg" = "X$p"; then
|
||||
enable_shared=yes
|
||||
fi
|
||||
done
|
||||
IFS="$lt_save_ifs"
|
||||
;;
|
||||
esac],
|
||||
[enable_shared=]_LT_ENABLE_SHARED_DEFAULT)
|
||||
|
||||
_LT_DECL([build_libtool_libs], [enable_shared], [0],
|
||||
[Whether or not to build shared libraries])
|
||||
])# _LT_ENABLE_SHARED
|
||||
|
||||
LT_OPTION_DEFINE([LT_INIT], [shared], [_LT_ENABLE_SHARED([yes])])
|
||||
LT_OPTION_DEFINE([LT_INIT], [disable-shared], [_LT_ENABLE_SHARED([no])])
|
||||
|
||||
# Old names:
|
||||
AC_DEFUN([AC_ENABLE_SHARED],
|
||||
[_LT_SET_OPTION([LT_INIT], m4_if([$1], [no], [disable-])[shared])
|
||||
])
|
||||
|
||||
AC_DEFUN([AC_DISABLE_SHARED],
|
||||
[_LT_SET_OPTION([LT_INIT], [disable-shared])
|
||||
])
|
||||
|
||||
AU_DEFUN([AM_ENABLE_SHARED], [AC_ENABLE_SHARED($@)])
|
||||
AU_DEFUN([AM_DISABLE_SHARED], [AC_DISABLE_SHARED($@)])
|
||||
|
||||
dnl aclocal-1.4 backwards compatibility:
|
||||
dnl AC_DEFUN([AM_ENABLE_SHARED], [])
|
||||
dnl AC_DEFUN([AM_DISABLE_SHARED], [])
|
||||
|
||||
|
||||
|
||||
# _LT_ENABLE_STATIC([DEFAULT])
|
||||
# ----------------------------
|
||||
# implement the --enable-static flag, and support the `static' and
|
||||
# `disable-static' LT_INIT options.
|
||||
# DEFAULT is either `yes' or `no'. If omitted, it defaults to `yes'.
|
||||
m4_define([_LT_ENABLE_STATIC],
|
||||
[m4_define([_LT_ENABLE_STATIC_DEFAULT], [m4_if($1, no, no, yes)])dnl
|
||||
AC_ARG_ENABLE([static],
|
||||
[AS_HELP_STRING([--enable-static@<:@=PKGS@:>@],
|
||||
[build static libraries @<:@default=]_LT_ENABLE_STATIC_DEFAULT[@:>@])],
|
||||
[p=${PACKAGE-default}
|
||||
case $enableval in
|
||||
yes) enable_static=yes ;;
|
||||
no) enable_static=no ;;
|
||||
*)
|
||||
enable_static=no
|
||||
# Look at the argument we got. We use all the common list separators.
|
||||
lt_save_ifs="$IFS"; IFS="${IFS}$PATH_SEPARATOR,"
|
||||
for pkg in $enableval; do
|
||||
IFS="$lt_save_ifs"
|
||||
if test "X$pkg" = "X$p"; then
|
||||
enable_static=yes
|
||||
fi
|
||||
done
|
||||
IFS="$lt_save_ifs"
|
||||
;;
|
||||
esac],
|
||||
[enable_static=]_LT_ENABLE_STATIC_DEFAULT)
|
||||
|
||||
_LT_DECL([build_old_libs], [enable_static], [0],
|
||||
[Whether or not to build static libraries])
|
||||
])# _LT_ENABLE_STATIC
|
||||
|
||||
LT_OPTION_DEFINE([LT_INIT], [static], [_LT_ENABLE_STATIC([yes])])
|
||||
LT_OPTION_DEFINE([LT_INIT], [disable-static], [_LT_ENABLE_STATIC([no])])
|
||||
|
||||
# Old names:
|
||||
AC_DEFUN([AC_ENABLE_STATIC],
|
||||
[_LT_SET_OPTION([LT_INIT], m4_if([$1], [no], [disable-])[static])
|
||||
])
|
||||
|
||||
AC_DEFUN([AC_DISABLE_STATIC],
|
||||
[_LT_SET_OPTION([LT_INIT], [disable-static])
|
||||
])
|
||||
|
||||
AU_DEFUN([AM_ENABLE_STATIC], [AC_ENABLE_STATIC($@)])
|
||||
AU_DEFUN([AM_DISABLE_STATIC], [AC_DISABLE_STATIC($@)])
|
||||
|
||||
dnl aclocal-1.4 backwards compatibility:
|
||||
dnl AC_DEFUN([AM_ENABLE_STATIC], [])
|
||||
dnl AC_DEFUN([AM_DISABLE_STATIC], [])
|
||||
|
||||
|
||||
|
||||
# _LT_ENABLE_FAST_INSTALL([DEFAULT])
|
||||
# ----------------------------------
|
||||
# implement the --enable-fast-install flag, and support the `fast-install'
|
||||
# and `disable-fast-install' LT_INIT options.
|
||||
# DEFAULT is either `yes' or `no'. If omitted, it defaults to `yes'.
|
||||
m4_define([_LT_ENABLE_FAST_INSTALL],
|
||||
[m4_define([_LT_ENABLE_FAST_INSTALL_DEFAULT], [m4_if($1, no, no, yes)])dnl
|
||||
AC_ARG_ENABLE([fast-install],
|
||||
[AS_HELP_STRING([--enable-fast-install@<:@=PKGS@:>@],
|
||||
[optimize for fast installation @<:@default=]_LT_ENABLE_FAST_INSTALL_DEFAULT[@:>@])],
|
||||
[p=${PACKAGE-default}
|
||||
case $enableval in
|
||||
yes) enable_fast_install=yes ;;
|
||||
no) enable_fast_install=no ;;
|
||||
*)
|
||||
enable_fast_install=no
|
||||
# Look at the argument we got. We use all the common list separators.
|
||||
lt_save_ifs="$IFS"; IFS="${IFS}$PATH_SEPARATOR,"
|
||||
for pkg in $enableval; do
|
||||
IFS="$lt_save_ifs"
|
||||
if test "X$pkg" = "X$p"; then
|
||||
enable_fast_install=yes
|
||||
fi
|
||||
done
|
||||
IFS="$lt_save_ifs"
|
||||
;;
|
||||
esac],
|
||||
[enable_fast_install=]_LT_ENABLE_FAST_INSTALL_DEFAULT)
|
||||
|
||||
_LT_DECL([fast_install], [enable_fast_install], [0],
|
||||
[Whether or not to optimize for fast installation])dnl
|
||||
])# _LT_ENABLE_FAST_INSTALL
|
||||
|
||||
LT_OPTION_DEFINE([LT_INIT], [fast-install], [_LT_ENABLE_FAST_INSTALL([yes])])
|
||||
LT_OPTION_DEFINE([LT_INIT], [disable-fast-install], [_LT_ENABLE_FAST_INSTALL([no])])
|
||||
|
||||
# Old names:
|
||||
AU_DEFUN([AC_ENABLE_FAST_INSTALL],
|
||||
[_LT_SET_OPTION([LT_INIT], m4_if([$1], [no], [disable-])[fast-install])
|
||||
AC_DIAGNOSE([obsolete],
|
||||
[$0: Remove this warning and the call to _LT_SET_OPTION when you put
|
||||
the `fast-install' option into LT_INIT's first parameter.])
|
||||
])
|
||||
|
||||
AU_DEFUN([AC_DISABLE_FAST_INSTALL],
|
||||
[_LT_SET_OPTION([LT_INIT], [disable-fast-install])
|
||||
AC_DIAGNOSE([obsolete],
|
||||
[$0: Remove this warning and the call to _LT_SET_OPTION when you put
|
||||
the `disable-fast-install' option into LT_INIT's first parameter.])
|
||||
])
|
||||
|
||||
dnl aclocal-1.4 backwards compatibility:
|
||||
dnl AC_DEFUN([AC_ENABLE_FAST_INSTALL], [])
|
||||
dnl AC_DEFUN([AM_DISABLE_FAST_INSTALL], [])
|
||||
|
||||
|
||||
# _LT_WITH_PIC([MODE])
|
||||
# --------------------
|
||||
# implement the --with-pic flag, and support the `pic-only' and `no-pic'
|
||||
# LT_INIT options.
|
||||
# MODE is either `yes' or `no'. If omitted, it defaults to `both'.
|
||||
m4_define([_LT_WITH_PIC],
|
||||
[AC_ARG_WITH([pic],
|
||||
[AS_HELP_STRING([--with-pic@<:@=PKGS@:>@],
|
||||
[try to use only PIC/non-PIC objects @<:@default=use both@:>@])],
|
||||
[lt_p=${PACKAGE-default}
|
||||
case $withval in
|
||||
yes|no) pic_mode=$withval ;;
|
||||
*)
|
||||
pic_mode=default
|
||||
# Look at the argument we got. We use all the common list separators.
|
||||
lt_save_ifs="$IFS"; IFS="${IFS}$PATH_SEPARATOR,"
|
||||
for lt_pkg in $withval; do
|
||||
IFS="$lt_save_ifs"
|
||||
if test "X$lt_pkg" = "X$lt_p"; then
|
||||
pic_mode=yes
|
||||
fi
|
||||
done
|
||||
IFS="$lt_save_ifs"
|
||||
;;
|
||||
esac],
|
||||
[pic_mode=default])
|
||||
|
||||
test -z "$pic_mode" && pic_mode=m4_default([$1], [default])
|
||||
|
||||
_LT_DECL([], [pic_mode], [0], [What type of objects to build])dnl
|
||||
])# _LT_WITH_PIC
|
||||
|
||||
LT_OPTION_DEFINE([LT_INIT], [pic-only], [_LT_WITH_PIC([yes])])
|
||||
LT_OPTION_DEFINE([LT_INIT], [no-pic], [_LT_WITH_PIC([no])])
|
||||
|
||||
# Old name:
|
||||
AU_DEFUN([AC_LIBTOOL_PICMODE],
|
||||
[_LT_SET_OPTION([LT_INIT], [pic-only])
|
||||
AC_DIAGNOSE([obsolete],
|
||||
[$0: Remove this warning and the call to _LT_SET_OPTION when you
|
||||
put the `pic-only' option into LT_INIT's first parameter.])
|
||||
])
|
||||
|
||||
dnl aclocal-1.4 backwards compatibility:
|
||||
dnl AC_DEFUN([AC_LIBTOOL_PICMODE], [])
|
||||
|
||||
## ----------------- ##
|
||||
## LTDL_INIT Options ##
|
||||
## ----------------- ##
|
||||
|
||||
m4_define([_LTDL_MODE], [])
|
||||
LT_OPTION_DEFINE([LTDL_INIT], [nonrecursive],
|
||||
[m4_define([_LTDL_MODE], [nonrecursive])])
|
||||
LT_OPTION_DEFINE([LTDL_INIT], [recursive],
|
||||
[m4_define([_LTDL_MODE], [recursive])])
|
||||
LT_OPTION_DEFINE([LTDL_INIT], [subproject],
|
||||
[m4_define([_LTDL_MODE], [subproject])])
|
||||
|
||||
m4_define([_LTDL_TYPE], [])
|
||||
LT_OPTION_DEFINE([LTDL_INIT], [installable],
|
||||
[m4_define([_LTDL_TYPE], [installable])])
|
||||
LT_OPTION_DEFINE([LTDL_INIT], [convenience],
|
||||
[m4_define([_LTDL_TYPE], [convenience])])
|
|
@ -1,123 +0,0 @@
|
|||
# ltsugar.m4 -- libtool m4 base layer. -*-Autoconf-*-
|
||||
#
|
||||
# Copyright (C) 2004, 2005, 2007, 2008 Free Software Foundation, Inc.
|
||||
# Written by Gary V. Vaughan, 2004
|
||||
#
|
||||
# This file is free software; the Free Software Foundation gives
|
||||
# unlimited permission to copy and/or distribute it, with or without
|
||||
# modifications, as long as this notice is preserved.
|
||||
|
||||
# serial 6 ltsugar.m4
|
||||
|
||||
# This is to help aclocal find these macros, as it can't see m4_define.
|
||||
AC_DEFUN([LTSUGAR_VERSION], [m4_if([0.1])])
|
||||
|
||||
|
||||
# lt_join(SEP, ARG1, [ARG2...])
|
||||
# -----------------------------
|
||||
# Produce ARG1SEPARG2...SEPARGn, omitting [] arguments and their
|
||||
# associated separator.
|
||||
# Needed until we can rely on m4_join from Autoconf 2.62, since all earlier
|
||||
# versions in m4sugar had bugs.
|
||||
m4_define([lt_join],
|
||||
[m4_if([$#], [1], [],
|
||||
[$#], [2], [[$2]],
|
||||
[m4_if([$2], [], [], [[$2]_])$0([$1], m4_shift(m4_shift($@)))])])
|
||||
m4_define([_lt_join],
|
||||
[m4_if([$#$2], [2], [],
|
||||
[m4_if([$2], [], [], [[$1$2]])$0([$1], m4_shift(m4_shift($@)))])])
|
||||
|
||||
|
||||
# lt_car(LIST)
|
||||
# lt_cdr(LIST)
|
||||
# ------------
|
||||
# Manipulate m4 lists.
|
||||
# These macros are necessary as long as will still need to support
|
||||
# Autoconf-2.59 which quotes differently.
|
||||
m4_define([lt_car], [[$1]])
|
||||
m4_define([lt_cdr],
|
||||
[m4_if([$#], 0, [m4_fatal([$0: cannot be called without arguments])],
|
||||
[$#], 1, [],
|
||||
[m4_dquote(m4_shift($@))])])
|
||||
m4_define([lt_unquote], $1)
|
||||
|
||||
|
||||
# lt_append(MACRO-NAME, STRING, [SEPARATOR])
|
||||
# ------------------------------------------
|
||||
# Redefine MACRO-NAME to hold its former content plus `SEPARATOR'`STRING'.
|
||||
# Note that neither SEPARATOR nor STRING are expanded; they are appended
|
||||
# to MACRO-NAME as is (leaving the expansion for when MACRO-NAME is invoked).
|
||||
# No SEPARATOR is output if MACRO-NAME was previously undefined (different
|
||||
# than defined and empty).
|
||||
#
|
||||
# This macro is needed until we can rely on Autoconf 2.62, since earlier
|
||||
# versions of m4sugar mistakenly expanded SEPARATOR but not STRING.
|
||||
m4_define([lt_append],
|
||||
[m4_define([$1],
|
||||
m4_ifdef([$1], [m4_defn([$1])[$3]])[$2])])
|
||||
|
||||
|
||||
|
||||
# lt_combine(SEP, PREFIX-LIST, INFIX, SUFFIX1, [SUFFIX2...])
|
||||
# ----------------------------------------------------------
|
||||
# Produce a SEP delimited list of all paired combinations of elements of
|
||||
# PREFIX-LIST with SUFFIX1 through SUFFIXn. Each element of the list
|
||||
# has the form PREFIXmINFIXSUFFIXn.
|
||||
# Needed until we can rely on m4_combine added in Autoconf 2.62.
|
||||
m4_define([lt_combine],
|
||||
[m4_if(m4_eval([$# > 3]), [1],
|
||||
[m4_pushdef([_Lt_sep], [m4_define([_Lt_sep], m4_defn([lt_car]))])]]dnl
|
||||
[[m4_foreach([_Lt_prefix], [$2],
|
||||
[m4_foreach([_Lt_suffix],
|
||||
]m4_dquote(m4_dquote(m4_shift(m4_shift(m4_shift($@)))))[,
|
||||
[_Lt_sep([$1])[]m4_defn([_Lt_prefix])[$3]m4_defn([_Lt_suffix])])])])])
|
||||
|
||||
|
||||
# lt_if_append_uniq(MACRO-NAME, VARNAME, [SEPARATOR], [UNIQ], [NOT-UNIQ])
|
||||
# -----------------------------------------------------------------------
|
||||
# Iff MACRO-NAME does not yet contain VARNAME, then append it (delimited
|
||||
# by SEPARATOR if supplied) and expand UNIQ, else NOT-UNIQ.
|
||||
m4_define([lt_if_append_uniq],
|
||||
[m4_ifdef([$1],
|
||||
[m4_if(m4_index([$3]m4_defn([$1])[$3], [$3$2$3]), [-1],
|
||||
[lt_append([$1], [$2], [$3])$4],
|
||||
[$5])],
|
||||
[lt_append([$1], [$2], [$3])$4])])
|
||||
|
||||
|
||||
# lt_dict_add(DICT, KEY, VALUE)
|
||||
# -----------------------------
|
||||
m4_define([lt_dict_add],
|
||||
[m4_define([$1($2)], [$3])])
|
||||
|
||||
|
||||
# lt_dict_add_subkey(DICT, KEY, SUBKEY, VALUE)
|
||||
# --------------------------------------------
|
||||
m4_define([lt_dict_add_subkey],
|
||||
[m4_define([$1($2:$3)], [$4])])
|
||||
|
||||
|
||||
# lt_dict_fetch(DICT, KEY, [SUBKEY])
|
||||
# ----------------------------------
|
||||
m4_define([lt_dict_fetch],
|
||||
[m4_ifval([$3],
|
||||
m4_ifdef([$1($2:$3)], [m4_defn([$1($2:$3)])]),
|
||||
m4_ifdef([$1($2)], [m4_defn([$1($2)])]))])
|
||||
|
||||
|
||||
# lt_if_dict_fetch(DICT, KEY, [SUBKEY], VALUE, IF-TRUE, [IF-FALSE])
|
||||
# -----------------------------------------------------------------
|
||||
m4_define([lt_if_dict_fetch],
|
||||
[m4_if(lt_dict_fetch([$1], [$2], [$3]), [$4],
|
||||
[$5],
|
||||
[$6])])
|
||||
|
||||
|
||||
# lt_dict_filter(DICT, [SUBKEY], VALUE, [SEPARATOR], KEY, [...])
|
||||
# --------------------------------------------------------------
|
||||
m4_define([lt_dict_filter],
|
||||
[m4_if([$5], [], [],
|
||||
[lt_join(m4_quote(m4_default([$4], [[, ]])),
|
||||
lt_unquote(m4_split(m4_normalize(m4_foreach(_Lt_key, lt_car([m4_shiftn(4, $@)]),
|
||||
[lt_if_dict_fetch([$1], _Lt_key, [$2], [$3], [_Lt_key ])])))))])[]dnl
|
||||
])
|
|
@ -1,23 +0,0 @@
|
|||
# ltversion.m4 -- version numbers -*- Autoconf -*-
|
||||
#
|
||||
# Copyright (C) 2004 Free Software Foundation, Inc.
|
||||
# Written by Scott James Remnant, 2004
|
||||
#
|
||||
# This file is free software; the Free Software Foundation gives
|
||||
# unlimited permission to copy and/or distribute it, with or without
|
||||
# modifications, as long as this notice is preserved.
|
||||
|
||||
# @configure_input@
|
||||
|
||||
# serial 3337 ltversion.m4
|
||||
# This file is part of GNU Libtool
|
||||
|
||||
m4_define([LT_PACKAGE_VERSION], [2.4.2])
|
||||
m4_define([LT_PACKAGE_REVISION], [1.3337])
|
||||
|
||||
AC_DEFUN([LTVERSION_VERSION],
|
||||
[macro_version='2.4.2'
|
||||
macro_revision='1.3337'
|
||||
_LT_DECL(, macro_version, 0, [Which release of libtool.m4 was used?])
|
||||
_LT_DECL(, macro_revision, 0)
|
||||
])
|
|
@ -1,98 +0,0 @@
|
|||
# lt~obsolete.m4 -- aclocal satisfying obsolete definitions. -*-Autoconf-*-
|
||||
#
|
||||
# Copyright (C) 2004, 2005, 2007, 2009 Free Software Foundation, Inc.
|
||||
# Written by Scott James Remnant, 2004.
|
||||
#
|
||||
# This file is free software; the Free Software Foundation gives
|
||||
# unlimited permission to copy and/or distribute it, with or without
|
||||
# modifications, as long as this notice is preserved.
|
||||
|
||||
# serial 5 lt~obsolete.m4
|
||||
|
||||
# These exist entirely to fool aclocal when bootstrapping libtool.
|
||||
#
|
||||
# In the past libtool.m4 has provided macros via AC_DEFUN (or AU_DEFUN)
|
||||
# which have later been changed to m4_define as they aren't part of the
|
||||
# exported API, or moved to Autoconf or Automake where they belong.
|
||||
#
|
||||
# The trouble is, aclocal is a bit thick. It'll see the old AC_DEFUN
|
||||
# in /usr/share/aclocal/libtool.m4 and remember it, then when it sees us
|
||||
# using a macro with the same name in our local m4/libtool.m4 it'll
|
||||
# pull the old libtool.m4 in (it doesn't see our shiny new m4_define
|
||||
# and doesn't know about Autoconf macros at all.)
|
||||
#
|
||||
# So we provide this file, which has a silly filename so it's always
|
||||
# included after everything else. This provides aclocal with the
|
||||
# AC_DEFUNs it wants, but when m4 processes it, it doesn't do anything
|
||||
# because those macros already exist, or will be overwritten later.
|
||||
# We use AC_DEFUN over AU_DEFUN for compatibility with aclocal-1.6.
|
||||
#
|
||||
# Anytime we withdraw an AC_DEFUN or AU_DEFUN, remember to add it here.
|
||||
# Yes, that means every name once taken will need to remain here until
|
||||
# we give up compatibility with versions before 1.7, at which point
|
||||
# we need to keep only those names which we still refer to.
|
||||
|
||||
# This is to help aclocal find these macros, as it can't see m4_define.
|
||||
AC_DEFUN([LTOBSOLETE_VERSION], [m4_if([1])])
|
||||
|
||||
m4_ifndef([AC_LIBTOOL_LINKER_OPTION], [AC_DEFUN([AC_LIBTOOL_LINKER_OPTION])])
|
||||
m4_ifndef([AC_PROG_EGREP], [AC_DEFUN([AC_PROG_EGREP])])
|
||||
m4_ifndef([_LT_AC_PROG_ECHO_BACKSLASH], [AC_DEFUN([_LT_AC_PROG_ECHO_BACKSLASH])])
|
||||
m4_ifndef([_LT_AC_SHELL_INIT], [AC_DEFUN([_LT_AC_SHELL_INIT])])
|
||||
m4_ifndef([_LT_AC_SYS_LIBPATH_AIX], [AC_DEFUN([_LT_AC_SYS_LIBPATH_AIX])])
|
||||
m4_ifndef([_LT_PROG_LTMAIN], [AC_DEFUN([_LT_PROG_LTMAIN])])
|
||||
m4_ifndef([_LT_AC_TAGVAR], [AC_DEFUN([_LT_AC_TAGVAR])])
|
||||
m4_ifndef([AC_LTDL_ENABLE_INSTALL], [AC_DEFUN([AC_LTDL_ENABLE_INSTALL])])
|
||||
m4_ifndef([AC_LTDL_PREOPEN], [AC_DEFUN([AC_LTDL_PREOPEN])])
|
||||
m4_ifndef([_LT_AC_SYS_COMPILER], [AC_DEFUN([_LT_AC_SYS_COMPILER])])
|
||||
m4_ifndef([_LT_AC_LOCK], [AC_DEFUN([_LT_AC_LOCK])])
|
||||
m4_ifndef([AC_LIBTOOL_SYS_OLD_ARCHIVE], [AC_DEFUN([AC_LIBTOOL_SYS_OLD_ARCHIVE])])
|
||||
m4_ifndef([_LT_AC_TRY_DLOPEN_SELF], [AC_DEFUN([_LT_AC_TRY_DLOPEN_SELF])])
|
||||
m4_ifndef([AC_LIBTOOL_PROG_CC_C_O], [AC_DEFUN([AC_LIBTOOL_PROG_CC_C_O])])
|
||||
m4_ifndef([AC_LIBTOOL_SYS_HARD_LINK_LOCKS], [AC_DEFUN([AC_LIBTOOL_SYS_HARD_LINK_LOCKS])])
|
||||
m4_ifndef([AC_LIBTOOL_OBJDIR], [AC_DEFUN([AC_LIBTOOL_OBJDIR])])
|
||||
m4_ifndef([AC_LTDL_OBJDIR], [AC_DEFUN([AC_LTDL_OBJDIR])])
|
||||
m4_ifndef([AC_LIBTOOL_PROG_LD_HARDCODE_LIBPATH], [AC_DEFUN([AC_LIBTOOL_PROG_LD_HARDCODE_LIBPATH])])
|
||||
m4_ifndef([AC_LIBTOOL_SYS_LIB_STRIP], [AC_DEFUN([AC_LIBTOOL_SYS_LIB_STRIP])])
|
||||
m4_ifndef([AC_PATH_MAGIC], [AC_DEFUN([AC_PATH_MAGIC])])
|
||||
m4_ifndef([AC_PROG_LD_GNU], [AC_DEFUN([AC_PROG_LD_GNU])])
|
||||
m4_ifndef([AC_PROG_LD_RELOAD_FLAG], [AC_DEFUN([AC_PROG_LD_RELOAD_FLAG])])
|
||||
m4_ifndef([AC_DEPLIBS_CHECK_METHOD], [AC_DEFUN([AC_DEPLIBS_CHECK_METHOD])])
|
||||
m4_ifndef([AC_LIBTOOL_PROG_COMPILER_NO_RTTI], [AC_DEFUN([AC_LIBTOOL_PROG_COMPILER_NO_RTTI])])
|
||||
m4_ifndef([AC_LIBTOOL_SYS_GLOBAL_SYMBOL_PIPE], [AC_DEFUN([AC_LIBTOOL_SYS_GLOBAL_SYMBOL_PIPE])])
|
||||
m4_ifndef([AC_LIBTOOL_PROG_COMPILER_PIC], [AC_DEFUN([AC_LIBTOOL_PROG_COMPILER_PIC])])
|
||||
m4_ifndef([AC_LIBTOOL_PROG_LD_SHLIBS], [AC_DEFUN([AC_LIBTOOL_PROG_LD_SHLIBS])])
|
||||
m4_ifndef([AC_LIBTOOL_POSTDEP_PREDEP], [AC_DEFUN([AC_LIBTOOL_POSTDEP_PREDEP])])
|
||||
m4_ifndef([LT_AC_PROG_EGREP], [AC_DEFUN([LT_AC_PROG_EGREP])])
|
||||
m4_ifndef([LT_AC_PROG_SED], [AC_DEFUN([LT_AC_PROG_SED])])
|
||||
m4_ifndef([_LT_CC_BASENAME], [AC_DEFUN([_LT_CC_BASENAME])])
|
||||
m4_ifndef([_LT_COMPILER_BOILERPLATE], [AC_DEFUN([_LT_COMPILER_BOILERPLATE])])
|
||||
m4_ifndef([_LT_LINKER_BOILERPLATE], [AC_DEFUN([_LT_LINKER_BOILERPLATE])])
|
||||
m4_ifndef([_AC_PROG_LIBTOOL], [AC_DEFUN([_AC_PROG_LIBTOOL])])
|
||||
m4_ifndef([AC_LIBTOOL_SETUP], [AC_DEFUN([AC_LIBTOOL_SETUP])])
|
||||
m4_ifndef([_LT_AC_CHECK_DLFCN], [AC_DEFUN([_LT_AC_CHECK_DLFCN])])
|
||||
m4_ifndef([AC_LIBTOOL_SYS_DYNAMIC_LINKER], [AC_DEFUN([AC_LIBTOOL_SYS_DYNAMIC_LINKER])])
|
||||
m4_ifndef([_LT_AC_TAGCONFIG], [AC_DEFUN([_LT_AC_TAGCONFIG])])
|
||||
m4_ifndef([AC_DISABLE_FAST_INSTALL], [AC_DEFUN([AC_DISABLE_FAST_INSTALL])])
|
||||
m4_ifndef([_LT_AC_LANG_CXX], [AC_DEFUN([_LT_AC_LANG_CXX])])
|
||||
m4_ifndef([_LT_AC_LANG_F77], [AC_DEFUN([_LT_AC_LANG_F77])])
|
||||
m4_ifndef([_LT_AC_LANG_GCJ], [AC_DEFUN([_LT_AC_LANG_GCJ])])
|
||||
m4_ifndef([AC_LIBTOOL_LANG_C_CONFIG], [AC_DEFUN([AC_LIBTOOL_LANG_C_CONFIG])])
|
||||
m4_ifndef([_LT_AC_LANG_C_CONFIG], [AC_DEFUN([_LT_AC_LANG_C_CONFIG])])
|
||||
m4_ifndef([AC_LIBTOOL_LANG_CXX_CONFIG], [AC_DEFUN([AC_LIBTOOL_LANG_CXX_CONFIG])])
|
||||
m4_ifndef([_LT_AC_LANG_CXX_CONFIG], [AC_DEFUN([_LT_AC_LANG_CXX_CONFIG])])
|
||||
m4_ifndef([AC_LIBTOOL_LANG_F77_CONFIG], [AC_DEFUN([AC_LIBTOOL_LANG_F77_CONFIG])])
|
||||
m4_ifndef([_LT_AC_LANG_F77_CONFIG], [AC_DEFUN([_LT_AC_LANG_F77_CONFIG])])
|
||||
m4_ifndef([AC_LIBTOOL_LANG_GCJ_CONFIG], [AC_DEFUN([AC_LIBTOOL_LANG_GCJ_CONFIG])])
|
||||
m4_ifndef([_LT_AC_LANG_GCJ_CONFIG], [AC_DEFUN([_LT_AC_LANG_GCJ_CONFIG])])
|
||||
m4_ifndef([AC_LIBTOOL_LANG_RC_CONFIG], [AC_DEFUN([AC_LIBTOOL_LANG_RC_CONFIG])])
|
||||
m4_ifndef([_LT_AC_LANG_RC_CONFIG], [AC_DEFUN([_LT_AC_LANG_RC_CONFIG])])
|
||||
m4_ifndef([AC_LIBTOOL_CONFIG], [AC_DEFUN([AC_LIBTOOL_CONFIG])])
|
||||
m4_ifndef([_LT_AC_FILE_LTDLL_C], [AC_DEFUN([_LT_AC_FILE_LTDLL_C])])
|
||||
m4_ifndef([_LT_REQUIRED_DARWIN_CHECKS], [AC_DEFUN([_LT_REQUIRED_DARWIN_CHECKS])])
|
||||
m4_ifndef([_LT_AC_PROG_CXXCPP], [AC_DEFUN([_LT_AC_PROG_CXXCPP])])
|
||||
m4_ifndef([_LT_PREPARE_SED_QUOTE_VARS], [AC_DEFUN([_LT_PREPARE_SED_QUOTE_VARS])])
|
||||
m4_ifndef([_LT_PROG_ECHO_BACKSLASH], [AC_DEFUN([_LT_PROG_ECHO_BACKSLASH])])
|
||||
m4_ifndef([_LT_PROG_F77], [AC_DEFUN([_LT_PROG_F77])])
|
||||
m4_ifndef([_LT_PROG_FC], [AC_DEFUN([_LT_PROG_FC])])
|
||||
m4_ifndef([_LT_PROG_CXX], [AC_DEFUN([_LT_PROG_CXX])])
|
After Width: | Height: | Size: 32 KiB |
After Width: | Height: | Size: 28 KiB |
After Width: | Height: | Size: 41 KiB |
After Width: | Height: | Size: 26 KiB |
After Width: | Height: | Size: 50 KiB |
After Width: | Height: | Size: 46 KiB |
After Width: | Height: | Size: 21 KiB |
|
@ -0,0 +1,404 @@
|
|||
|
||||
body {
|
||||
margin:147px 104px 147px 173px;
|
||||
|
||||
|
||||
font-size:20px;
|
||||
text-align:justify;
|
||||
|
||||
|
||||
|
||||
}
|
||||
|
||||
#index_number{
|
||||
|
||||
float:right;
|
||||
|
||||
}
|
||||
|
||||
a {
|
||||
|
||||
text-decoration:none;
|
||||
font-size:19px;
|
||||
color:#19191F;
|
||||
letter-spacing:1.5px;
|
||||
|
||||
font-family: 'Roboto Condensed', sans-serif;
|
||||
|
||||
|
||||
|
||||
|
||||
|
||||
}
|
||||
/*This is page1 css */
|
||||
|
||||
#box {
|
||||
|
||||
text-align:center;
|
||||
font-size:19px;
|
||||
margin-top:166px;
|
||||
|
||||
|
||||
}
|
||||
|
||||
#body_text{
|
||||
|
||||
font-family: 'Roboto Condensed', sans-serif;
|
||||
font-size:18px;
|
||||
|
||||
}
|
||||
|
||||
h1{
|
||||
font-weight:inherit;
|
||||
|
||||
}
|
||||
|
||||
h4{
|
||||
font-size:22px;
|
||||
|
||||
font-weight:inherit;
|
||||
|
||||
}
|
||||
|
||||
#footer{
|
||||
|
||||
margin:1px 0px 1px 0px;
|
||||
font-size:18px;
|
||||
text-align:justify;
|
||||
padding-bottom:104px;
|
||||
|
||||
|
||||
|
||||
}
|
||||
|
||||
p {
|
||||
margin:0;
|
||||
text-indent: 50px;
|
||||
font-size:19px;
|
||||
text-align:justify;
|
||||
|
||||
|
||||
}
|
||||
|
||||
|
||||
#footer_bar {
|
||||
border-top:solid;
|
||||
|
||||
border-top-width:thin;
|
||||
|
||||
}
|
||||
|
||||
#pages_paragraphs {
|
||||
margin:1px 115px 1px 57px;
|
||||
|
||||
|
||||
|
||||
}
|
||||
|
||||
#pages_paragraphs_2{
|
||||
margin:1px 0px 1px 0px;
|
||||
font-size:20px;
|
||||
text-align:justify;
|
||||
}
|
||||
|
||||
.code{
|
||||
font-size:22px;
|
||||
|
||||
}
|
||||
|
||||
|
||||
|
||||
|
||||
/* This is page3 css */
|
||||
|
||||
.index{
|
||||
font-weight:bold;
|
||||
text-align:justify;
|
||||
|
||||
}
|
||||
|
||||
.sub_indices {
|
||||
|
||||
padding-left:52px;
|
||||
text-align:justify;
|
||||
}
|
||||
|
||||
|
||||
|
||||
.aligning_numbers{
|
||||
|
||||
padding-left:27px;
|
||||
|
||||
|
||||
}
|
||||
|
||||
.aligning_page_number{
|
||||
|
||||
|
||||
float:right;
|
||||
|
||||
|
||||
}
|
||||
|
||||
/* This page 6 css */
|
||||
.box {
|
||||
|
||||
height:223px;
|
||||
}
|
||||
|
||||
|
||||
|
||||
.image-cell_1 {
|
||||
background: url(image1.png) no-repeat;
|
||||
width:716px;
|
||||
height:300px;
|
||||
|
||||
float:left;
|
||||
margin-left:180px;
|
||||
margin-right:134px;
|
||||
margin-bottom:1px;
|
||||
margin-bottom:31px;
|
||||
|
||||
}
|
||||
|
||||
|
||||
/* This page 9 and 10 css */
|
||||
|
||||
|
||||
|
||||
#number_spacing{
|
||||
|
||||
letter-spacing:1px;
|
||||
font-size:17px;
|
||||
|
||||
|
||||
}
|
||||
|
||||
|
||||
#number_spacing_1{
|
||||
|
||||
letter-spacing:1px;
|
||||
font-size:19px;
|
||||
margin-left:10px;
|
||||
|
||||
|
||||
}
|
||||
|
||||
/* this page 13 css */
|
||||
|
||||
|
||||
.image-cell_2 {
|
||||
background: url(image2.png) no-repeat;
|
||||
width:939px;
|
||||
height:419px;
|
||||
|
||||
float:left;
|
||||
margin-left:68px;
|
||||
margin-right:134px;
|
||||
margin-bottom:1px;
|
||||
margin-bottom:31px;
|
||||
|
||||
}
|
||||
|
||||
/* This is page 14 */
|
||||
#data1 table{
|
||||
border-top-style:solid;
|
||||
border-left-style:solid;
|
||||
|
||||
border-bottom-style:solid;
|
||||
font-family: 'Roboto Condensed', sans-serif;
|
||||
|
||||
}
|
||||
|
||||
#data1 th{
|
||||
border-bottom-style:solid;
|
||||
border-right-style:solid;
|
||||
border-right-style:thin;
|
||||
font-family: 'Roboto Condensed', sans-serif;
|
||||
|
||||
|
||||
}
|
||||
|
||||
#data1 td {
|
||||
border-right-style:solid;
|
||||
|
||||
font-family: 'Roboto Condensed', sans-serif;
|
||||
|
||||
}
|
||||
|
||||
|
||||
/* This is page 28 */
|
||||
#table_page28 table{
|
||||
border-top-style:solid;
|
||||
border-left-style:solid;
|
||||
|
||||
border-bottom-style:solid;
|
||||
border-top-width:thin;
|
||||
border-left-width:thin;
|
||||
border-bottom-width:thin;
|
||||
font-family: 'Roboto Condensed', sans-serif;
|
||||
|
||||
}
|
||||
|
||||
#table_page28 th{
|
||||
border-bottom-style:solid;
|
||||
border-right-style:solid;
|
||||
border-right-width:thin;
|
||||
border-bottom-width:thin;
|
||||
font-family: 'Roboto Condensed', sans-serif;
|
||||
|
||||
|
||||
}
|
||||
|
||||
#table_page28 td {
|
||||
border-right-style:solid;
|
||||
border-bottom-style:solid;
|
||||
border-bottom-width:thin;
|
||||
border-right-width:thin;
|
||||
font-family: 'Roboto Condensed', sans-serif;
|
||||
|
||||
}
|
||||
|
||||
|
||||
/* This is page 30 */
|
||||
#table_page30 table{
|
||||
border-top-style:solid;
|
||||
border-left-style:solid;
|
||||
|
||||
border-bottom-style:solid;
|
||||
|
||||
}
|
||||
|
||||
#table_page30 th{
|
||||
border-bottom-style:solid;
|
||||
border-right-style:solid;
|
||||
|
||||
|
||||
}
|
||||
|
||||
#table_page30 td {
|
||||
border-right-style:solid;
|
||||
border-bottom-style:solid;
|
||||
|
||||
|
||||
}
|
||||
#box_1 {
|
||||
|
||||
height:485px;
|
||||
margin-top:44px;
|
||||
margin-bottom:-61px;
|
||||
|
||||
}
|
||||
.image-cell_3 {
|
||||
background: url(image3.png) no-repeat;
|
||||
width:583px;
|
||||
height:393px;
|
||||
|
||||
float:left;
|
||||
|
||||
}
|
||||
|
||||
.image-cell_4 {
|
||||
background: url(image4.png) no-repeat;
|
||||
width:487px;
|
||||
height:390px;
|
||||
|
||||
float:right;
|
||||
|
||||
|
||||
|
||||
}
|
||||
|
||||
/* This is page 42 Css */
|
||||
|
||||
|
||||
.image-cell_5 {
|
||||
background: url(image5.png) no-repeat;
|
||||
width:907px;
|
||||
height:592px;
|
||||
|
||||
float:left;
|
||||
margin-right:134px;
|
||||
margin-bottom:1px;
|
||||
margin-bottom:31px;
|
||||
|
||||
}
|
||||
|
||||
|
||||
/* This is page 43 Css */
|
||||
|
||||
|
||||
.image-cell_6 {
|
||||
background: url(image6.png) no-repeat;
|
||||
width:851px;
|
||||
height:532px;
|
||||
|
||||
margin-right:134px;
|
||||
margin-bottom:1px;
|
||||
margin-bottom:31px;
|
||||
|
||||
}
|
||||
|
||||
/* This is page 44 Css */
|
||||
|
||||
|
||||
.image-cell_7{
|
||||
background: url(image7.png) no-repeat;
|
||||
width:945px;
|
||||
height:321px;
|
||||
|
||||
margin-right:134px;
|
||||
margin-bottom:1px;
|
||||
margin-bottom:31px;
|
||||
|
||||
}
|
||||
|
||||
/* This is page 45 */
|
||||
#data2 table{
|
||||
border-top-style:solid;
|
||||
border-left-style:solid;
|
||||
|
||||
border-bottom-style:solid;
|
||||
border-top-width:2px;
|
||||
border-left-width:2px;
|
||||
border-bottom-width:2px;
|
||||
border-color:black;
|
||||
font-family: 'Roboto Condensed', sans-serif;
|
||||
|
||||
}
|
||||
|
||||
#data2 th{
|
||||
border-bottom-style:solid;
|
||||
border-right-style:solid;
|
||||
border-bottom-width:2px;
|
||||
border-right-width:2px;
|
||||
font-family: 'Roboto Condensed', sans-serif;
|
||||
|
||||
|
||||
}
|
||||
#data2 td {
|
||||
border-right-style:solid;
|
||||
border-right-width:2px;
|
||||
font-family: 'Roboto Condensed', sans-serif;
|
||||
|
||||
}
|
||||
|
||||
|
||||
|
||||
|
||||
|
||||
|
||||
|
||||
|
||||
|
||||
|
||||
|
||||
|
||||
|
||||
|
||||
|
||||
|
||||
|
||||
|
||||
|
||||
|
215
missing
|
@ -1,215 +0,0 @@
|
|||
#! /bin/sh
|
||||
# Common wrapper for a few potentially missing GNU programs.
|
||||
|
||||
scriptversion=2013-10-28.13; # UTC
|
||||
|
||||
# Copyright (C) 1996-2013 Free Software Foundation, Inc.
|
||||
# Originally written by Fran,cois Pinard <pinard@iro.umontreal.ca>, 1996.
|
||||
|
||||
# This program is free software; you can redistribute it and/or modify
|
||||
# it under the terms of the GNU General Public License as published by
|
||||
# the Free Software Foundation; either version 2, or (at your option)
|
||||
# any later version.
|
||||
|
||||
# This program is distributed in the hope that it will be useful,
|
||||
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||
# GNU General Public License for more details.
|
||||
|
||||
# You should have received a copy of the GNU General Public License
|
||||
# along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||
|
||||
# As a special exception to the GNU General Public License, if you
|
||||
# distribute this file as part of a program that contains a
|
||||
# configuration script generated by Autoconf, you may include it under
|
||||
# the same distribution terms that you use for the rest of that program.
|
||||
|
||||
if test $# -eq 0; then
|
||||
echo 1>&2 "Try '$0 --help' for more information"
|
||||
exit 1
|
||||
fi
|
||||
|
||||
case $1 in
|
||||
|
||||
--is-lightweight)
|
||||
# Used by our autoconf macros to check whether the available missing
|
||||
# script is modern enough.
|
||||
exit 0
|
||||
;;
|
||||
|
||||
--run)
|
||||
# Back-compat with the calling convention used by older automake.
|
||||
shift
|
||||
;;
|
||||
|
||||
-h|--h|--he|--hel|--help)
|
||||
echo "\
|
||||
$0 [OPTION]... PROGRAM [ARGUMENT]...
|
||||
|
||||
Run 'PROGRAM [ARGUMENT]...', returning a proper advice when this fails due
|
||||
to PROGRAM being missing or too old.
|
||||
|
||||
Options:
|
||||
-h, --help display this help and exit
|
||||
-v, --version output version information and exit
|
||||
|
||||
Supported PROGRAM values:
|
||||
aclocal autoconf autoheader autom4te automake makeinfo
|
||||
bison yacc flex lex help2man
|
||||
|
||||
Version suffixes to PROGRAM as well as the prefixes 'gnu-', 'gnu', and
|
||||
'g' are ignored when checking the name.
|
||||
|
||||
Send bug reports to <bug-automake@gnu.org>."
|
||||
exit $?
|
||||
;;
|
||||
|
||||
-v|--v|--ve|--ver|--vers|--versi|--versio|--version)
|
||||
echo "missing $scriptversion (GNU Automake)"
|
||||
exit $?
|
||||
;;
|
||||
|
||||
-*)
|
||||
echo 1>&2 "$0: unknown '$1' option"
|
||||
echo 1>&2 "Try '$0 --help' for more information"
|
||||
exit 1
|
||||
;;
|
||||
|
||||
esac
|
||||
|
||||
# Run the given program, remember its exit status.
|
||||
"$@"; st=$?
|
||||
|
||||
# If it succeeded, we are done.
|
||||
test $st -eq 0 && exit 0
|
||||
|
||||
# Also exit now if we it failed (or wasn't found), and '--version' was
|
||||
# passed; such an option is passed most likely to detect whether the
|
||||
# program is present and works.
|
||||
case $2 in --version|--help) exit $st;; esac
|
||||
|
||||
# Exit code 63 means version mismatch. This often happens when the user
|
||||
# tries to use an ancient version of a tool on a file that requires a
|
||||
# minimum version.
|
||||
if test $st -eq 63; then
|
||||
msg="probably too old"
|
||||
elif test $st -eq 127; then
|
||||
# Program was missing.
|
||||
msg="missing on your system"
|
||||
else
|
||||
# Program was found and executed, but failed. Give up.
|
||||
exit $st
|
||||
fi
|
||||
|
||||
perl_URL=http://www.perl.org/
|
||||
flex_URL=http://flex.sourceforge.net/
|
||||
gnu_software_URL=http://www.gnu.org/software
|
||||
|
||||
program_details ()
|
||||
{
|
||||
case $1 in
|
||||
aclocal|automake)
|
||||
echo "The '$1' program is part of the GNU Automake package:"
|
||||
echo "<$gnu_software_URL/automake>"
|
||||
echo "It also requires GNU Autoconf, GNU m4 and Perl in order to run:"
|
||||
echo "<$gnu_software_URL/autoconf>"
|
||||
echo "<$gnu_software_URL/m4/>"
|
||||
echo "<$perl_URL>"
|
||||
;;
|
||||
autoconf|autom4te|autoheader)
|
||||
echo "The '$1' program is part of the GNU Autoconf package:"
|
||||
echo "<$gnu_software_URL/autoconf/>"
|
||||
echo "It also requires GNU m4 and Perl in order to run:"
|
||||
echo "<$gnu_software_URL/m4/>"
|
||||
echo "<$perl_URL>"
|
||||
;;
|
||||
esac
|
||||
}
|
||||
|
||||
give_advice ()
|
||||
{
|
||||
# Normalize program name to check for.
|
||||
normalized_program=`echo "$1" | sed '
|
||||
s/^gnu-//; t
|
||||
s/^gnu//; t
|
||||
s/^g//; t'`
|
||||
|
||||
printf '%s\n' "'$1' is $msg."
|
||||
|
||||
configure_deps="'configure.ac' or m4 files included by 'configure.ac'"
|
||||
case $normalized_program in
|
||||
autoconf*)
|
||||
echo "You should only need it if you modified 'configure.ac',"
|
||||
echo "or m4 files included by it."
|
||||
program_details 'autoconf'
|
||||
;;
|
||||
autoheader*)
|
||||
echo "You should only need it if you modified 'acconfig.h' or"
|
||||
echo "$configure_deps."
|
||||
program_details 'autoheader'
|
||||
;;
|
||||
automake*)
|
||||
echo "You should only need it if you modified 'Makefile.am' or"
|
||||
echo "$configure_deps."
|
||||
program_details 'automake'
|
||||
;;
|
||||
aclocal*)
|
||||
echo "You should only need it if you modified 'acinclude.m4' or"
|
||||
echo "$configure_deps."
|
||||
program_details 'aclocal'
|
||||
;;
|
||||
autom4te*)
|
||||
echo "You might have modified some maintainer files that require"
|
||||
echo "the 'autom4te' program to be rebuilt."
|
||||
program_details 'autom4te'
|
||||
;;
|
||||
bison*|yacc*)
|
||||
echo "You should only need it if you modified a '.y' file."
|
||||
echo "You may want to install the GNU Bison package:"
|
||||
echo "<$gnu_software_URL/bison/>"
|
||||
;;
|
||||
lex*|flex*)
|
||||
echo "You should only need it if you modified a '.l' file."
|
||||
echo "You may want to install the Fast Lexical Analyzer package:"
|
||||
echo "<$flex_URL>"
|
||||
;;
|
||||
help2man*)
|
||||
echo "You should only need it if you modified a dependency" \
|
||||
"of a man page."
|
||||
echo "You may want to install the GNU Help2man package:"
|
||||
echo "<$gnu_software_URL/help2man/>"
|
||||
;;
|
||||
makeinfo*)
|
||||
echo "You should only need it if you modified a '.texi' file, or"
|
||||
echo "any other file indirectly affecting the aspect of the manual."
|
||||
echo "You might want to install the Texinfo package:"
|
||||
echo "<$gnu_software_URL/texinfo/>"
|
||||
echo "The spurious makeinfo call might also be the consequence of"
|
||||
echo "using a buggy 'make' (AIX, DU, IRIX), in which case you might"
|
||||
echo "want to install GNU make:"
|
||||
echo "<$gnu_software_URL/make/>"
|
||||
;;
|
||||
*)
|
||||
echo "You might have modified some files without having the proper"
|
||||
echo "tools for further handling them. Check the 'README' file, it"
|
||||
echo "often tells you about the needed prerequisites for installing"
|
||||
echo "this package. You may also peek at any GNU archive site, in"
|
||||
echo "case some other package contains this missing '$1' program."
|
||||
;;
|
||||
esac
|
||||
}
|
||||
|
||||
give_advice "$1" | sed -e '1s/^/WARNING: /' \
|
||||
-e '2,$s/^/ /' >&2
|
||||
|
||||
# Propagate the correct exit status (expected to be 127 for a program
|
||||
# not found, 63 for a program that failed due to version mismatch).
|
||||
exit $st
|
||||
|
||||
# Local variables:
|
||||
# eval: (add-hook 'write-file-hooks 'time-stamp)
|
||||
# time-stamp-start: "scriptversion="
|
||||
# time-stamp-format: "%:y-%02m-%02d.%02H"
|
||||
# time-stamp-time-zone: "UTC"
|
||||
# time-stamp-end: "; # UTC"
|
||||
# End:
|
|
@ -1,86 +0,0 @@
|
|||
#
|
||||
# GNUmakefile for Galois field library
|
||||
#
|
||||
# The default flags do *not* have the SSE instructions enabled.
|
||||
# Please cd to flag_tester and run which_compile_flags.sh to see which SSE instructions
|
||||
# your machine and compiler support, and which flags you should include below.
|
||||
|
||||
CFLAGS = -O3
|
||||
LDFLAGS = -O3
|
||||
|
||||
SRCS = gf_w4.c gf_w8.c gf_w16.c gf_w32.c gf_w64.c gf_w128.c gf_wgen.c gf.c gf_unit.c \
|
||||
gf_time.c gf_mult.c gf_method.c gf_methods.c gf_div.c gf_rand.c gf_general.c \
|
||||
gf_poly.c gf_example_1.c gf_add.c gf_example_2.c gf_example_3.c gf_example_4.c \
|
||||
gf_inline_time.c gf_example_5.c gf_example_6.c gf_example_7.c
|
||||
|
||||
HDRS = gf_complete.h gf_int.h
|
||||
|
||||
EXECUTABLES = gf_mult gf_div gf_add gf_unit gf_time gf_methods gf_poly \
|
||||
gf_example_1 gf_example_2 gf_example_3 gf_example_4 gf_inline_time \
|
||||
gf_example_5 gf_example_6 gf_example_7
|
||||
|
||||
RM = /bin/rm -f
|
||||
|
||||
LIBOBJS = gf.o gf_method.o gf_wgen.o gf_w4.o gf_w8.o gf_w16.o gf_w32.o \
|
||||
gf_w64.o gf_w128.o gf_rand.o gf_general.o
|
||||
|
||||
OBJS = $(addsuffix .o, $(basename $(SRCS)))
|
||||
|
||||
DEFAULT = $(EXECUTABLES) gf_complete.a
|
||||
|
||||
default: $(DEFAULT)
|
||||
|
||||
all: $(OBJS)
|
||||
|
||||
gf_complete.a: $(LIBOBJS)
|
||||
ar ru gf_complete.a $(LIBOBJS)
|
||||
ranlib gf_complete.a
|
||||
|
||||
gf_methods: gf_methods.o gf_complete.a
|
||||
gf_time: gf_time.o gf_complete.a
|
||||
gf_inline_time: gf_inline_time.o gf_complete.a
|
||||
gf_unit: gf_unit.o gf_complete.a
|
||||
gf_example_1: gf_example_1.o gf_complete.a
|
||||
gf_example_2: gf_example_2.o gf_complete.a
|
||||
gf_example_3: gf_example_3.o gf_complete.a
|
||||
gf_example_4: gf_example_4.o gf_complete.a
|
||||
gf_example_5: gf_example_5.o gf_complete.a
|
||||
gf_example_6: gf_example_6.o gf_complete.a
|
||||
gf_example_7: gf_example_7.o gf_complete.a
|
||||
gf_mult: gf_mult.o gf_complete.a
|
||||
gf_div: gf_div.o gf_complete.a
|
||||
gf_poly: gf_poly.o gf_complete.a
|
||||
gf_add: gf_add.o
|
||||
|
||||
clean:
|
||||
$(RM) $(OBJS) gf_div.c
|
||||
|
||||
spotless: clean
|
||||
$(RM) *~ $(EXECUTABLES) which_compile_flags
|
||||
$(RM) gf_complete.a
|
||||
|
||||
gf_div.o: gf_complete.h gf_method.h
|
||||
gf_methods.o: gf_complete.h gf_method.h
|
||||
gf_time.o: gf_complete.h gf_method.h gf_rand.h gf_general.h
|
||||
gf_inline_time.o: gf_complete.h gf_rand.h
|
||||
gf_wgen.o: gf_int.h gf_complete.h
|
||||
gf_w4.o: gf_int.h gf_complete.h
|
||||
gf_w8.o: gf_int.h gf_complete.h
|
||||
gf_w16.o: gf_int.h gf_complete.h
|
||||
gf_w32.o: gf_int.h gf_complete.h
|
||||
gf_w64.o: gf_int.h gf_complete.h
|
||||
gf_unit.o: gf_complete.h gf_method.h gf_rand.h gf_general.h
|
||||
gf_example_1.o: gf_complete.h gf_rand.h
|
||||
gf_example_2.o: gf_complete.h gf_rand.h
|
||||
gf_example_3.o: gf_complete.h gf_rand.h
|
||||
gf_example_4.o: gf_complete.h gf_rand.h
|
||||
gf_example_5.o: gf_complete.h gf_rand.h
|
||||
gf_example_6.o: gf_complete.h gf_rand.h
|
||||
gf_example_7.o: gf_complete.h gf_rand.h
|
||||
gf_general.o: gf_complete.h gf_int.h gf_general.h gf_rand.h
|
||||
gf_mult.o: gf_complete.h gf_method.h
|
||||
gf.o: gf_complete.h gf_int.h
|
||||
gf_method.o: gf_complete.h
|
||||
|
||||
gf_div.c: gf_mult.c
|
||||
sed -e 's/product/quotient/' -e 's/multiply/divide/g' -e 's/multiplication/division/' -e 's/mult/div/' gf_mult.c > gf_div.c
|
|
@ -1,62 +0,0 @@
|
|||
# GF-Complete AM file
|
||||
# Only creates library and distributes header files
|
||||
|
||||
INCLUDES=-I./
|
||||
AM_CFLAGS = -O3 $(SIMD_FLAGS) -fPIC $(INCLUDES)
|
||||
|
||||
lib_LTLIBRARIES = libgf_complete.la
|
||||
libgf_complete_la_SOURCES = gf.c gf_method.c gf_wgen.c gf_w4.c gf_w8.c gf_w16.c gf_w32.c \
|
||||
gf_w64.c gf_w128.c gf_rand.c gf_general.c
|
||||
libgf_complete_la_LDFLAGS = -version-info 1:0:0
|
||||
include_HEADERS = gf_complete.h
|
||||
|
||||
bin_PROGRAMS = gf_mult gf_div gf_add gf_unit gf_time gf_methods gf_poly \
|
||||
gf_example_1 gf_example_2 gf_example_3 gf_example_4 gf_inline_time \
|
||||
gf_example_5 gf_example_6 gf_example_7
|
||||
|
||||
gf_mult_SOURCES = gf_mult.c
|
||||
gf_mult_LDFLAGS = -lgf_complete
|
||||
|
||||
gf_div_SOURCES = gf_div.c
|
||||
gf_div_LDFLAGS = -lgf_complete
|
||||
|
||||
gf_add_SOURCES = gf_add.c
|
||||
gf_add_LDFLAGS = -lgf_complete
|
||||
|
||||
gf_unit_SOURCES = gf_unit.c
|
||||
gf_unit_LDFLAGS = -lgf_complete
|
||||
|
||||
gf_time_SOURCES = gf_time.c
|
||||
gf_time_LDFLAGS = -lgf_complete
|
||||
|
||||
gf_methods_SOURCES = gf_methods.c
|
||||
gf_methods_LDFLAGS = -lgf_complete
|
||||
|
||||
gf_poly_SOURCES = gf_poly.c
|
||||
gf_poly_LDFLAGS = -lgf_complete
|
||||
|
||||
gf_inline_time_SOURCES = gf_inline_time.c
|
||||
gf_inline_time_LDFLAGS = -lgf_complete
|
||||
|
||||
gf_example_1_SOURCES = gf_example_1.c
|
||||
gf_example_1_LDFLAGS = -lgf_complete
|
||||
|
||||
gf_example_2_SOURCES = gf_example_2.c
|
||||
gf_example_2_LDFLAGS = -lgf_complete
|
||||
|
||||
gf_example_3_SOURCES = gf_example_3.c
|
||||
gf_example_3_LDFLAGS = -lgf_complete
|
||||
|
||||
gf_example_4_SOURCES = gf_example_4.c
|
||||
gf_example_4_LDFLAGS = -lgf_complete
|
||||
|
||||
gf_example_5_SOURCES = gf_example_5.c
|
||||
gf_example_5_LDFLAGS = -lgf_complete
|
||||
|
||||
gf_example_6_SOURCES = gf_example_6.c
|
||||
gf_example_6_LDFLAGS = -lgf_complete
|
||||
|
||||
gf_example_7_SOURCES = gf_example_7.c
|
||||
gf_example_7_LDFLAGS = -lgf_complete
|
||||
|
||||
|
|
@ -1,11 +1,32 @@
|
|||
# GF-Complete 'core' AM file
|
||||
# Creates the library
|
||||
|
||||
INCLUDES=-I./ -I../include
|
||||
AM_CFLAGS = -O3 $(SIMD_FLAGS) -fPIC $(INCLUDES)
|
||||
AUTOMAKE_OPTIONS = subdir-objects
|
||||
|
||||
AM_CPPFLAGS = -I$(top_builddir)/include -I$(top_srcdir)/include
|
||||
|
||||
# avoid using SIMD_FLAGS for code that calls strcmp as new gcc
|
||||
# versions will use SIMD for the strcmp implementation. Instead
|
||||
# we create a static library just for gf_method that is not compiled
|
||||
# with SIMD_FLAGS, this static library will get linked into gf_complete.so
|
||||
noinst_LTLIBRARIES = libgf_util.la
|
||||
libgf_util_la_SOURCES = gf_method.c
|
||||
libgf_util_la_CFLAGS = -O3 -fPIC -Wsign-compare
|
||||
|
||||
# we narrowly use SIMD_FLAGS for code that needs it
|
||||
lib_LTLIBRARIES = libgf_complete.la
|
||||
libgf_complete_la_SOURCES = gf.c gf_method.c gf_wgen.c gf_w4.c gf_w8.c gf_w16.c gf_w32.c \
|
||||
gf_w64.c gf_w128.c gf_rand.c gf_general.c
|
||||
libgf_complete_la_SOURCES = gf.c gf_wgen.c gf_w4.c gf_w8.c gf_w16.c gf_w32.c \
|
||||
gf_w64.c gf_w128.c gf_rand.c gf_general.c gf_cpu.c
|
||||
libgf_complete_la_CFLAGS = -O3 $(SIMD_FLAGS) -fPIC -Wsign-compare
|
||||
libgf_complete_la_LIBADD = libgf_util.la
|
||||
|
||||
if HAVE_NEON
|
||||
libgf_complete_la_SOURCES += neon/gf_w4_neon.c \
|
||||
neon/gf_w8_neon.c \
|
||||
neon/gf_w16_neon.c \
|
||||
neon/gf_w32_neon.c \
|
||||
neon/gf_w64_neon.c
|
||||
endif
|
||||
|
||||
libgf_complete_la_LDFLAGS = -version-info 1:0:0
|
||||
|
||||
|
|
654
src/Makefile.in
|
@ -1,654 +0,0 @@
|
|||
# Makefile.in generated by automake 1.14.1 from Makefile.am.
|
||||
# @configure_input@
|
||||
|
||||
# Copyright (C) 1994-2013 Free Software Foundation, Inc.
|
||||
|
||||
# This Makefile.in is free software; the Free Software Foundation
|
||||
# gives unlimited permission to copy and/or distribute it,
|
||||
# with or without modifications, as long as this notice is preserved.
|
||||
|
||||
# This program is distributed in the hope that it will be useful,
|
||||
# but WITHOUT ANY WARRANTY, to the extent permitted by law; without
|
||||
# even the implied warranty of MERCHANTABILITY or FITNESS FOR A
|
||||
# PARTICULAR PURPOSE.
|
||||
|
||||
@SET_MAKE@
|
||||
|
||||
# GF-Complete 'core' AM file
|
||||
# Creates the library
|
||||
|
||||
VPATH = @srcdir@
|
||||
am__is_gnu_make = test -n '$(MAKEFILE_LIST)' && test -n '$(MAKELEVEL)'
|
||||
am__make_running_with_option = \
|
||||
case $${target_option-} in \
|
||||
?) ;; \
|
||||
*) echo "am__make_running_with_option: internal error: invalid" \
|
||||
"target option '$${target_option-}' specified" >&2; \
|
||||
exit 1;; \
|
||||
esac; \
|
||||
has_opt=no; \
|
||||
sane_makeflags=$$MAKEFLAGS; \
|
||||
if $(am__is_gnu_make); then \
|
||||
sane_makeflags=$$MFLAGS; \
|
||||
else \
|
||||
case $$MAKEFLAGS in \
|
||||
*\\[\ \ ]*) \
|
||||
bs=\\; \
|
||||
sane_makeflags=`printf '%s\n' "$$MAKEFLAGS" \
|
||||
| sed "s/$$bs$$bs[$$bs $$bs ]*//g"`;; \
|
||||
esac; \
|
||||
fi; \
|
||||
skip_next=no; \
|
||||
strip_trailopt () \
|
||||
{ \
|
||||
flg=`printf '%s\n' "$$flg" | sed "s/$$1.*$$//"`; \
|
||||
}; \
|
||||
for flg in $$sane_makeflags; do \
|
||||
test $$skip_next = yes && { skip_next=no; continue; }; \
|
||||
case $$flg in \
|
||||
*=*|--*) continue;; \
|
||||
-*I) strip_trailopt 'I'; skip_next=yes;; \
|
||||
-*I?*) strip_trailopt 'I';; \
|
||||
-*O) strip_trailopt 'O'; skip_next=yes;; \
|
||||
-*O?*) strip_trailopt 'O';; \
|
||||
-*l) strip_trailopt 'l'; skip_next=yes;; \
|
||||
-*l?*) strip_trailopt 'l';; \
|
||||
-[dEDm]) skip_next=yes;; \
|
||||
-[JT]) skip_next=yes;; \
|
||||
esac; \
|
||||
case $$flg in \
|
||||
*$$target_option*) has_opt=yes; break;; \
|
||||
esac; \
|
||||
done; \
|
||||
test $$has_opt = yes
|
||||
am__make_dryrun = (target_option=n; $(am__make_running_with_option))
|
||||
am__make_keepgoing = (target_option=k; $(am__make_running_with_option))
|
||||
pkgdatadir = $(datadir)/@PACKAGE@
|
||||
pkgincludedir = $(includedir)/@PACKAGE@
|
||||
pkglibdir = $(libdir)/@PACKAGE@
|
||||
pkglibexecdir = $(libexecdir)/@PACKAGE@
|
||||
am__cd = CDPATH="$${ZSH_VERSION+.}$(PATH_SEPARATOR)" && cd
|
||||
install_sh_DATA = $(install_sh) -c -m 644
|
||||
install_sh_PROGRAM = $(install_sh) -c
|
||||
install_sh_SCRIPT = $(install_sh) -c
|
||||
INSTALL_HEADER = $(INSTALL_DATA)
|
||||
transform = $(program_transform_name)
|
||||
NORMAL_INSTALL = :
|
||||
PRE_INSTALL = :
|
||||
POST_INSTALL = :
|
||||
NORMAL_UNINSTALL = :
|
||||
PRE_UNINSTALL = :
|
||||
POST_UNINSTALL = :
|
||||
build_triplet = @build@
|
||||
host_triplet = @host@
|
||||
subdir = src
|
||||
DIST_COMMON = $(srcdir)/Makefile.in $(srcdir)/Makefile.am \
|
||||
$(top_srcdir)/depcomp
|
||||
ACLOCAL_M4 = $(top_srcdir)/aclocal.m4
|
||||
am__aclocal_m4_deps = $(top_srcdir)/m4/ax_check_compile_flag.m4 \
|
||||
$(top_srcdir)/m4/ax_ext.m4 \
|
||||
$(top_srcdir)/m4/ax_gcc_x86_avx_xgetbv.m4 \
|
||||
$(top_srcdir)/m4/ax_gcc_x86_cpuid.m4 \
|
||||
$(top_srcdir)/m4/libtool.m4 $(top_srcdir)/m4/ltoptions.m4 \
|
||||
$(top_srcdir)/m4/ltsugar.m4 $(top_srcdir)/m4/ltversion.m4 \
|
||||
$(top_srcdir)/m4/lt~obsolete.m4 $(top_srcdir)/configure.ac
|
||||
am__configure_deps = $(am__aclocal_m4_deps) $(CONFIGURE_DEPENDENCIES) \
|
||||
$(ACLOCAL_M4)
|
||||
mkinstalldirs = $(install_sh) -d
|
||||
CONFIG_HEADER = $(top_builddir)/include/config.h
|
||||
CONFIG_CLEAN_FILES =
|
||||
CONFIG_CLEAN_VPATH_FILES =
|
||||
am__vpath_adj_setup = srcdirstrip=`echo "$(srcdir)" | sed 's|.|.|g'`;
|
||||
am__vpath_adj = case $$p in \
|
||||
$(srcdir)/*) f=`echo "$$p" | sed "s|^$$srcdirstrip/||"`;; \
|
||||
*) f=$$p;; \
|
||||
esac;
|
||||
am__strip_dir = f=`echo $$p | sed -e 's|^.*/||'`;
|
||||
am__install_max = 40
|
||||
am__nobase_strip_setup = \
|
||||
srcdirstrip=`echo "$(srcdir)" | sed 's/[].[^$$\\*|]/\\\\&/g'`
|
||||
am__nobase_strip = \
|
||||
for p in $$list; do echo "$$p"; done | sed -e "s|$$srcdirstrip/||"
|
||||
am__nobase_list = $(am__nobase_strip_setup); \
|
||||
for p in $$list; do echo "$$p $$p"; done | \
|
||||
sed "s| $$srcdirstrip/| |;"' / .*\//!s/ .*/ ./; s,\( .*\)/[^/]*$$,\1,' | \
|
||||
$(AWK) 'BEGIN { files["."] = "" } { files[$$2] = files[$$2] " " $$1; \
|
||||
if (++n[$$2] == $(am__install_max)) \
|
||||
{ print $$2, files[$$2]; n[$$2] = 0; files[$$2] = "" } } \
|
||||
END { for (dir in files) print dir, files[dir] }'
|
||||
am__base_list = \
|
||||
sed '$$!N;$$!N;$$!N;$$!N;$$!N;$$!N;$$!N;s/\n/ /g' | \
|
||||
sed '$$!N;$$!N;$$!N;$$!N;s/\n/ /g'
|
||||
am__uninstall_files_from_dir = { \
|
||||
test -z "$$files" \
|
||||
|| { test ! -d "$$dir" && test ! -f "$$dir" && test ! -r "$$dir"; } \
|
||||
|| { echo " ( cd '$$dir' && rm -f" $$files ")"; \
|
||||
$(am__cd) "$$dir" && rm -f $$files; }; \
|
||||
}
|
||||
am__installdirs = "$(DESTDIR)$(libdir)"
|
||||
LTLIBRARIES = $(lib_LTLIBRARIES)
|
||||
libgf_complete_la_LIBADD =
|
||||
am_libgf_complete_la_OBJECTS = gf.lo gf_method.lo gf_wgen.lo gf_w4.lo \
|
||||
gf_w8.lo gf_w16.lo gf_w32.lo gf_w64.lo gf_w128.lo gf_rand.lo \
|
||||
gf_general.lo
|
||||
libgf_complete_la_OBJECTS = $(am_libgf_complete_la_OBJECTS)
|
||||
AM_V_lt = $(am__v_lt_@AM_V@)
|
||||
am__v_lt_ = $(am__v_lt_@AM_DEFAULT_V@)
|
||||
am__v_lt_0 = --silent
|
||||
am__v_lt_1 =
|
||||
libgf_complete_la_LINK = $(LIBTOOL) $(AM_V_lt) --tag=CC \
|
||||
$(AM_LIBTOOLFLAGS) $(LIBTOOLFLAGS) --mode=link $(CCLD) \
|
||||
$(AM_CFLAGS) $(CFLAGS) $(libgf_complete_la_LDFLAGS) $(LDFLAGS) \
|
||||
-o $@
|
||||
AM_V_P = $(am__v_P_@AM_V@)
|
||||
am__v_P_ = $(am__v_P_@AM_DEFAULT_V@)
|
||||
am__v_P_0 = false
|
||||
am__v_P_1 = :
|
||||
AM_V_GEN = $(am__v_GEN_@AM_V@)
|
||||
am__v_GEN_ = $(am__v_GEN_@AM_DEFAULT_V@)
|
||||
am__v_GEN_0 = @echo " GEN " $@;
|
||||
am__v_GEN_1 =
|
||||
AM_V_at = $(am__v_at_@AM_V@)
|
||||
am__v_at_ = $(am__v_at_@AM_DEFAULT_V@)
|
||||
am__v_at_0 = @
|
||||
am__v_at_1 =
|
||||
DEFAULT_INCLUDES = -I.@am__isrc@ -I$(top_builddir)/include
|
||||
depcomp = $(SHELL) $(top_srcdir)/depcomp
|
||||
am__depfiles_maybe = depfiles
|
||||
am__mv = mv -f
|
||||
COMPILE = $(CC) $(DEFS) $(DEFAULT_INCLUDES) $(INCLUDES) $(AM_CPPFLAGS) \
|
||||
$(CPPFLAGS) $(AM_CFLAGS) $(CFLAGS)
|
||||
LTCOMPILE = $(LIBTOOL) $(AM_V_lt) --tag=CC $(AM_LIBTOOLFLAGS) \
|
||||
$(LIBTOOLFLAGS) --mode=compile $(CC) $(DEFS) \
|
||||
$(DEFAULT_INCLUDES) $(INCLUDES) $(AM_CPPFLAGS) $(CPPFLAGS) \
|
||||
$(AM_CFLAGS) $(CFLAGS)
|
||||
AM_V_CC = $(am__v_CC_@AM_V@)
|
||||
am__v_CC_ = $(am__v_CC_@AM_DEFAULT_V@)
|
||||
am__v_CC_0 = @echo " CC " $@;
|
||||
am__v_CC_1 =
|
||||
CCLD = $(CC)
|
||||
LINK = $(LIBTOOL) $(AM_V_lt) --tag=CC $(AM_LIBTOOLFLAGS) \
|
||||
$(LIBTOOLFLAGS) --mode=link $(CCLD) $(AM_CFLAGS) $(CFLAGS) \
|
||||
$(AM_LDFLAGS) $(LDFLAGS) -o $@
|
||||
AM_V_CCLD = $(am__v_CCLD_@AM_V@)
|
||||
am__v_CCLD_ = $(am__v_CCLD_@AM_DEFAULT_V@)
|
||||
am__v_CCLD_0 = @echo " CCLD " $@;
|
||||
am__v_CCLD_1 =
|
||||
SOURCES = $(libgf_complete_la_SOURCES)
|
||||
DIST_SOURCES = $(libgf_complete_la_SOURCES)
|
||||
am__can_run_installinfo = \
|
||||
case $$AM_UPDATE_INFO_DIR in \
|
||||
n|no|NO) false;; \
|
||||
*) (install-info --version) >/dev/null 2>&1;; \
|
||||
esac
|
||||
am__tagged_files = $(HEADERS) $(SOURCES) $(TAGS_FILES) $(LISP)
|
||||
# Read a list of newline-separated strings from the standard input,
|
||||
# and print each of them once, without duplicates. Input order is
|
||||
# *not* preserved.
|
||||
am__uniquify_input = $(AWK) '\
|
||||
BEGIN { nonempty = 0; } \
|
||||
{ items[$$0] = 1; nonempty = 1; } \
|
||||
END { if (nonempty) { for (i in items) print i; }; } \
|
||||
'
|
||||
# Make sure the list of sources is unique. This is necessary because,
|
||||
# e.g., the same source file might be shared among _SOURCES variables
|
||||
# for different programs/libraries.
|
||||
am__define_uniq_tagged_files = \
|
||||
list='$(am__tagged_files)'; \
|
||||
unique=`for i in $$list; do \
|
||||
if test -f "$$i"; then echo $$i; else echo $(srcdir)/$$i; fi; \
|
||||
done | $(am__uniquify_input)`
|
||||
ETAGS = etags
|
||||
CTAGS = ctags
|
||||
DISTFILES = $(DIST_COMMON) $(DIST_SOURCES) $(TEXINFOS) $(EXTRA_DIST)
|
||||
ACLOCAL = @ACLOCAL@
|
||||
AMTAR = @AMTAR@
|
||||
AM_DEFAULT_VERBOSITY = @AM_DEFAULT_VERBOSITY@
|
||||
AR = @AR@
|
||||
AUTOCONF = @AUTOCONF@
|
||||
AUTOHEADER = @AUTOHEADER@
|
||||
AUTOMAKE = @AUTOMAKE@
|
||||
AWK = @AWK@
|
||||
CC = @CC@
|
||||
CCDEPMODE = @CCDEPMODE@
|
||||
CFLAGS = @CFLAGS@
|
||||
CPP = @CPP@
|
||||
CPPFLAGS = @CPPFLAGS@
|
||||
CYGPATH_W = @CYGPATH_W@
|
||||
DEFS = @DEFS@
|
||||
DEPDIR = @DEPDIR@
|
||||
DLLTOOL = @DLLTOOL@
|
||||
DSYMUTIL = @DSYMUTIL@
|
||||
DUMPBIN = @DUMPBIN@
|
||||
ECHO_C = @ECHO_C@
|
||||
ECHO_N = @ECHO_N@
|
||||
ECHO_T = @ECHO_T@
|
||||
EGREP = @EGREP@
|
||||
EXEEXT = @EXEEXT@
|
||||
FGREP = @FGREP@
|
||||
GREP = @GREP@
|
||||
INSTALL = @INSTALL@
|
||||
INSTALL_DATA = @INSTALL_DATA@
|
||||
INSTALL_PROGRAM = @INSTALL_PROGRAM@
|
||||
INSTALL_SCRIPT = @INSTALL_SCRIPT@
|
||||
INSTALL_STRIP_PROGRAM = @INSTALL_STRIP_PROGRAM@
|
||||
LD = @LD@
|
||||
LDFLAGS = @LDFLAGS@
|
||||
LIBOBJS = @LIBOBJS@
|
||||
LIBS = @LIBS@
|
||||
LIBTOOL = @LIBTOOL@
|
||||
LIPO = @LIPO@
|
||||
LN_S = @LN_S@
|
||||
LTLIBOBJS = @LTLIBOBJS@
|
||||
MAINT = @MAINT@
|
||||
MAKEINFO = @MAKEINFO@
|
||||
MANIFEST_TOOL = @MANIFEST_TOOL@
|
||||
MKDIR_P = @MKDIR_P@
|
||||
NM = @NM@
|
||||
NMEDIT = @NMEDIT@
|
||||
OBJDUMP = @OBJDUMP@
|
||||
OBJEXT = @OBJEXT@
|
||||
OTOOL = @OTOOL@
|
||||
OTOOL64 = @OTOOL64@
|
||||
PACKAGE = @PACKAGE@
|
||||
PACKAGE_BUGREPORT = @PACKAGE_BUGREPORT@
|
||||
PACKAGE_NAME = @PACKAGE_NAME@
|
||||
PACKAGE_STRING = @PACKAGE_STRING@
|
||||
PACKAGE_TARNAME = @PACKAGE_TARNAME@
|
||||
PACKAGE_URL = @PACKAGE_URL@
|
||||
PACKAGE_VERSION = @PACKAGE_VERSION@
|
||||
PATH_SEPARATOR = @PATH_SEPARATOR@
|
||||
RANLIB = @RANLIB@
|
||||
SED = @SED@
|
||||
SET_MAKE = @SET_MAKE@
|
||||
SHELL = @SHELL@
|
||||
SIMD_FLAGS = @SIMD_FLAGS@
|
||||
STRIP = @STRIP@
|
||||
VERSION = @VERSION@
|
||||
abs_builddir = @abs_builddir@
|
||||
abs_srcdir = @abs_srcdir@
|
||||
abs_top_builddir = @abs_top_builddir@
|
||||
abs_top_srcdir = @abs_top_srcdir@
|
||||
ac_ct_AR = @ac_ct_AR@
|
||||
ac_ct_CC = @ac_ct_CC@
|
||||
ac_ct_DUMPBIN = @ac_ct_DUMPBIN@
|
||||
am__include = @am__include@
|
||||
am__leading_dot = @am__leading_dot@
|
||||
am__quote = @am__quote@
|
||||
am__tar = @am__tar@
|
||||
am__untar = @am__untar@
|
||||
bindir = @bindir@
|
||||
build = @build@
|
||||
build_alias = @build_alias@
|
||||
build_cpu = @build_cpu@
|
||||
build_os = @build_os@
|
||||
build_vendor = @build_vendor@
|
||||
builddir = @builddir@
|
||||
datadir = @datadir@
|
||||
datarootdir = @datarootdir@
|
||||
docdir = @docdir@
|
||||
dvidir = @dvidir@
|
||||
exec_prefix = @exec_prefix@
|
||||
host = @host@
|
||||
host_alias = @host_alias@
|
||||
host_cpu = @host_cpu@
|
||||
host_os = @host_os@
|
||||
host_vendor = @host_vendor@
|
||||
htmldir = @htmldir@
|
||||
includedir = @includedir@
|
||||
infodir = @infodir@
|
||||
install_sh = @install_sh@
|
||||
libdir = @libdir@
|
||||
libexecdir = @libexecdir@
|
||||
localedir = @localedir@
|
||||
localstatedir = @localstatedir@
|
||||
mandir = @mandir@
|
||||
mkdir_p = @mkdir_p@
|
||||
oldincludedir = @oldincludedir@
|
||||
pdfdir = @pdfdir@
|
||||
prefix = @prefix@
|
||||
program_transform_name = @program_transform_name@
|
||||
psdir = @psdir@
|
||||
sbindir = @sbindir@
|
||||
sharedstatedir = @sharedstatedir@
|
||||
srcdir = @srcdir@
|
||||
sysconfdir = @sysconfdir@
|
||||
target_alias = @target_alias@
|
||||
top_build_prefix = @top_build_prefix@
|
||||
top_builddir = @top_builddir@
|
||||
top_srcdir = @top_srcdir@
|
||||
INCLUDES = -I./ -I../include
|
||||
AM_CFLAGS = -O3 $(SIMD_FLAGS) -fPIC $(INCLUDES)
|
||||
lib_LTLIBRARIES = libgf_complete.la
|
||||
libgf_complete_la_SOURCES = gf.c gf_method.c gf_wgen.c gf_w4.c gf_w8.c gf_w16.c gf_w32.c \
|
||||
gf_w64.c gf_w128.c gf_rand.c gf_general.c
|
||||
|
||||
libgf_complete_la_LDFLAGS = -version-info 1:0:0
|
||||
all: all-am
|
||||
|
||||
.SUFFIXES:
|
||||
.SUFFIXES: .c .lo .o .obj
|
||||
$(srcdir)/Makefile.in: @MAINTAINER_MODE_TRUE@ $(srcdir)/Makefile.am $(am__configure_deps)
|
||||
@for dep in $?; do \
|
||||
case '$(am__configure_deps)' in \
|
||||
*$$dep*) \
|
||||
( cd $(top_builddir) && $(MAKE) $(AM_MAKEFLAGS) am--refresh ) \
|
||||
&& { if test -f $@; then exit 0; else break; fi; }; \
|
||||
exit 1;; \
|
||||
esac; \
|
||||
done; \
|
||||
echo ' cd $(top_srcdir) && $(AUTOMAKE) --gnu src/Makefile'; \
|
||||
$(am__cd) $(top_srcdir) && \
|
||||
$(AUTOMAKE) --gnu src/Makefile
|
||||
.PRECIOUS: Makefile
|
||||
Makefile: $(srcdir)/Makefile.in $(top_builddir)/config.status
|
||||
@case '$?' in \
|
||||
*config.status*) \
|
||||
cd $(top_builddir) && $(MAKE) $(AM_MAKEFLAGS) am--refresh;; \
|
||||
*) \
|
||||
echo ' cd $(top_builddir) && $(SHELL) ./config.status $(subdir)/$@ $(am__depfiles_maybe)'; \
|
||||
cd $(top_builddir) && $(SHELL) ./config.status $(subdir)/$@ $(am__depfiles_maybe);; \
|
||||
esac;
|
||||
|
||||
$(top_builddir)/config.status: $(top_srcdir)/configure $(CONFIG_STATUS_DEPENDENCIES)
|
||||
cd $(top_builddir) && $(MAKE) $(AM_MAKEFLAGS) am--refresh
|
||||
|
||||
$(top_srcdir)/configure: @MAINTAINER_MODE_TRUE@ $(am__configure_deps)
|
||||
cd $(top_builddir) && $(MAKE) $(AM_MAKEFLAGS) am--refresh
|
||||
$(ACLOCAL_M4): @MAINTAINER_MODE_TRUE@ $(am__aclocal_m4_deps)
|
||||
cd $(top_builddir) && $(MAKE) $(AM_MAKEFLAGS) am--refresh
|
||||
$(am__aclocal_m4_deps):
|
||||
|
||||
install-libLTLIBRARIES: $(lib_LTLIBRARIES)
|
||||
@$(NORMAL_INSTALL)
|
||||
@list='$(lib_LTLIBRARIES)'; test -n "$(libdir)" || list=; \
|
||||
list2=; for p in $$list; do \
|
||||
if test -f $$p; then \
|
||||
list2="$$list2 $$p"; \
|
||||
else :; fi; \
|
||||
done; \
|
||||
test -z "$$list2" || { \
|
||||
echo " $(MKDIR_P) '$(DESTDIR)$(libdir)'"; \
|
||||
$(MKDIR_P) "$(DESTDIR)$(libdir)" || exit 1; \
|
||||
echo " $(LIBTOOL) $(AM_LIBTOOLFLAGS) $(LIBTOOLFLAGS) --mode=install $(INSTALL) $(INSTALL_STRIP_FLAG) $$list2 '$(DESTDIR)$(libdir)'"; \
|
||||
$(LIBTOOL) $(AM_LIBTOOLFLAGS) $(LIBTOOLFLAGS) --mode=install $(INSTALL) $(INSTALL_STRIP_FLAG) $$list2 "$(DESTDIR)$(libdir)"; \
|
||||
}
|
||||
|
||||
uninstall-libLTLIBRARIES:
|
||||
@$(NORMAL_UNINSTALL)
|
||||
@list='$(lib_LTLIBRARIES)'; test -n "$(libdir)" || list=; \
|
||||
for p in $$list; do \
|
||||
$(am__strip_dir) \
|
||||
echo " $(LIBTOOL) $(AM_LIBTOOLFLAGS) $(LIBTOOLFLAGS) --mode=uninstall rm -f '$(DESTDIR)$(libdir)/$$f'"; \
|
||||
$(LIBTOOL) $(AM_LIBTOOLFLAGS) $(LIBTOOLFLAGS) --mode=uninstall rm -f "$(DESTDIR)$(libdir)/$$f"; \
|
||||
done
|
||||
|
||||
clean-libLTLIBRARIES:
|
||||
-test -z "$(lib_LTLIBRARIES)" || rm -f $(lib_LTLIBRARIES)
|
||||
@list='$(lib_LTLIBRARIES)'; \
|
||||
locs=`for p in $$list; do echo $$p; done | \
|
||||
sed 's|^[^/]*$$|.|; s|/[^/]*$$||; s|$$|/so_locations|' | \
|
||||
sort -u`; \
|
||||
test -z "$$locs" || { \
|
||||
echo rm -f $${locs}; \
|
||||
rm -f $${locs}; \
|
||||
}
|
||||
|
||||
libgf_complete.la: $(libgf_complete_la_OBJECTS) $(libgf_complete_la_DEPENDENCIES) $(EXTRA_libgf_complete_la_DEPENDENCIES)
|
||||
$(AM_V_CCLD)$(libgf_complete_la_LINK) -rpath $(libdir) $(libgf_complete_la_OBJECTS) $(libgf_complete_la_LIBADD) $(LIBS)
|
||||
|
||||
mostlyclean-compile:
|
||||
-rm -f *.$(OBJEXT)
|
||||
|
||||
distclean-compile:
|
||||
-rm -f *.tab.c
|
||||
|
||||
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/gf.Plo@am__quote@
|
||||
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/gf_general.Plo@am__quote@
|
||||
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/gf_method.Plo@am__quote@
|
||||
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/gf_rand.Plo@am__quote@
|
||||
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/gf_w128.Plo@am__quote@
|
||||
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/gf_w16.Plo@am__quote@
|
||||
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/gf_w32.Plo@am__quote@
|
||||
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/gf_w4.Plo@am__quote@
|
||||
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/gf_w64.Plo@am__quote@
|
||||
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/gf_w8.Plo@am__quote@
|
||||
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/gf_wgen.Plo@am__quote@
|
||||
|
||||
.c.o:
|
||||
@am__fastdepCC_TRUE@ $(AM_V_CC)$(COMPILE) -MT $@ -MD -MP -MF $(DEPDIR)/$*.Tpo -c -o $@ $<
|
||||
@am__fastdepCC_TRUE@ $(AM_V_at)$(am__mv) $(DEPDIR)/$*.Tpo $(DEPDIR)/$*.Po
|
||||
@AMDEP_TRUE@@am__fastdepCC_FALSE@ $(AM_V_CC)source='$<' object='$@' libtool=no @AMDEPBACKSLASH@
|
||||
@AMDEP_TRUE@@am__fastdepCC_FALSE@ DEPDIR=$(DEPDIR) $(CCDEPMODE) $(depcomp) @AMDEPBACKSLASH@
|
||||
@am__fastdepCC_FALSE@ $(AM_V_CC@am__nodep@)$(COMPILE) -c -o $@ $<
|
||||
|
||||
.c.obj:
|
||||
@am__fastdepCC_TRUE@ $(AM_V_CC)$(COMPILE) -MT $@ -MD -MP -MF $(DEPDIR)/$*.Tpo -c -o $@ `$(CYGPATH_W) '$<'`
|
||||
@am__fastdepCC_TRUE@ $(AM_V_at)$(am__mv) $(DEPDIR)/$*.Tpo $(DEPDIR)/$*.Po
|
||||
@AMDEP_TRUE@@am__fastdepCC_FALSE@ $(AM_V_CC)source='$<' object='$@' libtool=no @AMDEPBACKSLASH@
|
||||
@AMDEP_TRUE@@am__fastdepCC_FALSE@ DEPDIR=$(DEPDIR) $(CCDEPMODE) $(depcomp) @AMDEPBACKSLASH@
|
||||
@am__fastdepCC_FALSE@ $(AM_V_CC@am__nodep@)$(COMPILE) -c -o $@ `$(CYGPATH_W) '$<'`
|
||||
|
||||
.c.lo:
|
||||
@am__fastdepCC_TRUE@ $(AM_V_CC)$(LTCOMPILE) -MT $@ -MD -MP -MF $(DEPDIR)/$*.Tpo -c -o $@ $<
|
||||
@am__fastdepCC_TRUE@ $(AM_V_at)$(am__mv) $(DEPDIR)/$*.Tpo $(DEPDIR)/$*.Plo
|
||||
@AMDEP_TRUE@@am__fastdepCC_FALSE@ $(AM_V_CC)source='$<' object='$@' libtool=yes @AMDEPBACKSLASH@
|
||||
@AMDEP_TRUE@@am__fastdepCC_FALSE@ DEPDIR=$(DEPDIR) $(CCDEPMODE) $(depcomp) @AMDEPBACKSLASH@
|
||||
@am__fastdepCC_FALSE@ $(AM_V_CC@am__nodep@)$(LTCOMPILE) -c -o $@ $<
|
||||
|
||||
mostlyclean-libtool:
|
||||
-rm -f *.lo
|
||||
|
||||
clean-libtool:
|
||||
-rm -rf .libs _libs
|
||||
|
||||
ID: $(am__tagged_files)
|
||||
$(am__define_uniq_tagged_files); mkid -fID $$unique
|
||||
tags: tags-am
|
||||
TAGS: tags
|
||||
|
||||
tags-am: $(TAGS_DEPENDENCIES) $(am__tagged_files)
|
||||
set x; \
|
||||
here=`pwd`; \
|
||||
$(am__define_uniq_tagged_files); \
|
||||
shift; \
|
||||
if test -z "$(ETAGS_ARGS)$$*$$unique"; then :; else \
|
||||
test -n "$$unique" || unique=$$empty_fix; \
|
||||
if test $$# -gt 0; then \
|
||||
$(ETAGS) $(ETAGSFLAGS) $(AM_ETAGSFLAGS) $(ETAGS_ARGS) \
|
||||
"$$@" $$unique; \
|
||||
else \
|
||||
$(ETAGS) $(ETAGSFLAGS) $(AM_ETAGSFLAGS) $(ETAGS_ARGS) \
|
||||
$$unique; \
|
||||
fi; \
|
||||
fi
|
||||
ctags: ctags-am
|
||||
|
||||
CTAGS: ctags
|
||||
ctags-am: $(TAGS_DEPENDENCIES) $(am__tagged_files)
|
||||
$(am__define_uniq_tagged_files); \
|
||||
test -z "$(CTAGS_ARGS)$$unique" \
|
||||
|| $(CTAGS) $(CTAGSFLAGS) $(AM_CTAGSFLAGS) $(CTAGS_ARGS) \
|
||||
$$unique
|
||||
|
||||
GTAGS:
|
||||
here=`$(am__cd) $(top_builddir) && pwd` \
|
||||
&& $(am__cd) $(top_srcdir) \
|
||||
&& gtags -i $(GTAGS_ARGS) "$$here"
|
||||
cscopelist: cscopelist-am
|
||||
|
||||
cscopelist-am: $(am__tagged_files)
|
||||
list='$(am__tagged_files)'; \
|
||||
case "$(srcdir)" in \
|
||||
[\\/]* | ?:[\\/]*) sdir="$(srcdir)" ;; \
|
||||
*) sdir=$(subdir)/$(srcdir) ;; \
|
||||
esac; \
|
||||
for i in $$list; do \
|
||||
if test -f "$$i"; then \
|
||||
echo "$(subdir)/$$i"; \
|
||||
else \
|
||||
echo "$$sdir/$$i"; \
|
||||
fi; \
|
||||
done >> $(top_builddir)/cscope.files
|
||||
|
||||
distclean-tags:
|
||||
-rm -f TAGS ID GTAGS GRTAGS GSYMS GPATH tags
|
||||
|
||||
distdir: $(DISTFILES)
|
||||
@srcdirstrip=`echo "$(srcdir)" | sed 's/[].[^$$\\*]/\\\\&/g'`; \
|
||||
topsrcdirstrip=`echo "$(top_srcdir)" | sed 's/[].[^$$\\*]/\\\\&/g'`; \
|
||||
list='$(DISTFILES)'; \
|
||||
dist_files=`for file in $$list; do echo $$file; done | \
|
||||
sed -e "s|^$$srcdirstrip/||;t" \
|
||||
-e "s|^$$topsrcdirstrip/|$(top_builddir)/|;t"`; \
|
||||
case $$dist_files in \
|
||||
*/*) $(MKDIR_P) `echo "$$dist_files" | \
|
||||
sed '/\//!d;s|^|$(distdir)/|;s,/[^/]*$$,,' | \
|
||||
sort -u` ;; \
|
||||
esac; \
|
||||
for file in $$dist_files; do \
|
||||
if test -f $$file || test -d $$file; then d=.; else d=$(srcdir); fi; \
|
||||
if test -d $$d/$$file; then \
|
||||
dir=`echo "/$$file" | sed -e 's,/[^/]*$$,,'`; \
|
||||
if test -d "$(distdir)/$$file"; then \
|
||||
find "$(distdir)/$$file" -type d ! -perm -700 -exec chmod u+rwx {} \;; \
|
||||
fi; \
|
||||
if test -d $(srcdir)/$$file && test $$d != $(srcdir); then \
|
||||
cp -fpR $(srcdir)/$$file "$(distdir)$$dir" || exit 1; \
|
||||
find "$(distdir)/$$file" -type d ! -perm -700 -exec chmod u+rwx {} \;; \
|
||||
fi; \
|
||||
cp -fpR $$d/$$file "$(distdir)$$dir" || exit 1; \
|
||||
else \
|
||||
test -f "$(distdir)/$$file" \
|
||||
|| cp -p $$d/$$file "$(distdir)/$$file" \
|
||||
|| exit 1; \
|
||||
fi; \
|
||||
done
|
||||
check-am: all-am
|
||||
check: check-am
|
||||
all-am: Makefile $(LTLIBRARIES)
|
||||
installdirs:
|
||||
for dir in "$(DESTDIR)$(libdir)"; do \
|
||||
test -z "$$dir" || $(MKDIR_P) "$$dir"; \
|
||||
done
|
||||
install: install-am
|
||||
install-exec: install-exec-am
|
||||
install-data: install-data-am
|
||||
uninstall: uninstall-am
|
||||
|
||||
install-am: all-am
|
||||
@$(MAKE) $(AM_MAKEFLAGS) install-exec-am install-data-am
|
||||
|
||||
installcheck: installcheck-am
|
||||
install-strip:
|
||||
if test -z '$(STRIP)'; then \
|
||||
$(MAKE) $(AM_MAKEFLAGS) INSTALL_PROGRAM="$(INSTALL_STRIP_PROGRAM)" \
|
||||
install_sh_PROGRAM="$(INSTALL_STRIP_PROGRAM)" INSTALL_STRIP_FLAG=-s \
|
||||
install; \
|
||||
else \
|
||||
$(MAKE) $(AM_MAKEFLAGS) INSTALL_PROGRAM="$(INSTALL_STRIP_PROGRAM)" \
|
||||
install_sh_PROGRAM="$(INSTALL_STRIP_PROGRAM)" INSTALL_STRIP_FLAG=-s \
|
||||
"INSTALL_PROGRAM_ENV=STRIPPROG='$(STRIP)'" install; \
|
||||
fi
|
||||
mostlyclean-generic:
|
||||
|
||||
clean-generic:
|
||||
|
||||
distclean-generic:
|
||||
-test -z "$(CONFIG_CLEAN_FILES)" || rm -f $(CONFIG_CLEAN_FILES)
|
||||
-test . = "$(srcdir)" || test -z "$(CONFIG_CLEAN_VPATH_FILES)" || rm -f $(CONFIG_CLEAN_VPATH_FILES)
|
||||
|
||||
maintainer-clean-generic:
|
||||
@echo "This command is intended for maintainers to use"
|
||||
@echo "it deletes files that may require special tools to rebuild."
|
||||
clean: clean-am
|
||||
|
||||
clean-am: clean-generic clean-libLTLIBRARIES clean-libtool \
|
||||
mostlyclean-am
|
||||
|
||||
distclean: distclean-am
|
||||
-rm -rf ./$(DEPDIR)
|
||||
-rm -f Makefile
|
||||
distclean-am: clean-am distclean-compile distclean-generic \
|
||||
distclean-tags
|
||||
|
||||
dvi: dvi-am
|
||||
|
||||
dvi-am:
|
||||
|
||||
html: html-am
|
||||
|
||||
html-am:
|
||||
|
||||
info: info-am
|
||||
|
||||
info-am:
|
||||
|
||||
install-data-am:
|
||||
|
||||
install-dvi: install-dvi-am
|
||||
|
||||
install-dvi-am:
|
||||
|
||||
install-exec-am: install-libLTLIBRARIES
|
||||
|
||||
install-html: install-html-am
|
||||
|
||||
install-html-am:
|
||||
|
||||
install-info: install-info-am
|
||||
|
||||
install-info-am:
|
||||
|
||||
install-man:
|
||||
|
||||
install-pdf: install-pdf-am
|
||||
|
||||
install-pdf-am:
|
||||
|
||||
install-ps: install-ps-am
|
||||
|
||||
install-ps-am:
|
||||
|
||||
installcheck-am:
|
||||
|
||||
maintainer-clean: maintainer-clean-am
|
||||
-rm -rf ./$(DEPDIR)
|
||||
-rm -f Makefile
|
||||
maintainer-clean-am: distclean-am maintainer-clean-generic
|
||||
|
||||
mostlyclean: mostlyclean-am
|
||||
|
||||
mostlyclean-am: mostlyclean-compile mostlyclean-generic \
|
||||
mostlyclean-libtool
|
||||
|
||||
pdf: pdf-am
|
||||
|
||||
pdf-am:
|
||||
|
||||
ps: ps-am
|
||||
|
||||
ps-am:
|
||||
|
||||
uninstall-am: uninstall-libLTLIBRARIES
|
||||
|
||||
.MAKE: install-am install-strip
|
||||
|
||||
.PHONY: CTAGS GTAGS TAGS all all-am check check-am clean clean-generic \
|
||||
clean-libLTLIBRARIES clean-libtool cscopelist-am ctags \
|
||||
ctags-am distclean distclean-compile distclean-generic \
|
||||
distclean-libtool distclean-tags distdir dvi dvi-am html \
|
||||
html-am info info-am install install-am install-data \
|
||||
install-data-am install-dvi install-dvi-am install-exec \
|
||||
install-exec-am install-html install-html-am install-info \
|
||||
install-info-am install-libLTLIBRARIES install-man install-pdf \
|
||||
install-pdf-am install-ps install-ps-am install-strip \
|
||||
installcheck installcheck-am installdirs maintainer-clean \
|
||||
maintainer-clean-generic mostlyclean mostlyclean-compile \
|
||||
mostlyclean-generic mostlyclean-libtool pdf pdf-am ps ps-am \
|
||||
tags tags-am uninstall uninstall-am uninstall-libLTLIBRARIES
|
||||
|
||||
|
||||
# Tell versions [3.59,3.63) of GNU make to not export all variables.
|
||||
# Otherwise a system limit (for SysV at least) may be exceeded.
|
||||
.NOEXPORT:
|
241
src/gf.c
|
@ -11,6 +11,8 @@
|
|||
#include "gf_int.h"
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
#include <assert.h>
|
||||
#include "gf_cpu.h"
|
||||
|
||||
int _gf_errno = GF_E_DEFAULT;
|
||||
|
||||
|
@ -41,7 +43,7 @@ void gf_error()
|
|||
case GF_E_MDEFARG: s = "If multiplication method == default, can't use arg1/arg2."; break;
|
||||
case GF_E_DIVCOMP: s = "Cannot change the division technique with -m COMPOSITE."; break;
|
||||
case GF_E_DOUQUAD: s = "Cannot specify -r DOUBLE and -r QUAD."; break;
|
||||
case GF_E_SSE__NO: s = "Cannot specify -r SSE and -r NOSSE."; break;
|
||||
case GF_E_SIMD_NO: s = "Cannot specify -r SIMD and -r NOSIMD."; break;
|
||||
case GF_E_CAUCHYB: s = "Cannot specify -r CAUCHY and any other -r."; break;
|
||||
case GF_E_CAUCOMP: s = "Cannot specify -m COMPOSITE and -r CAUCHY."; break;
|
||||
case GF_E_CAUGT32: s = "Cannot specify -r CAUCHY with w > 32."; break;
|
||||
|
@ -51,23 +53,23 @@ void gf_error()
|
|||
case GF_E_BAD___W: s = "W must be 1-32, 64 or 128."; break;
|
||||
case GF_E_DOUBLET: s = "Can only specify -r DOUBLE with -m TABLE."; break;
|
||||
case GF_E_DOUBLEW: s = "Can only specify -r DOUBLE w = 4 or w = 8."; break;
|
||||
case GF_E_DOUBLEJ: s = "Cannot specify -r DOUBLE with -r ALTMAP|SSE|NOSSE."; break;
|
||||
case GF_E_DOUBLEJ: s = "Cannot specify -r DOUBLE with -r ALTMAP|SIMD|NOSIMD."; break;
|
||||
case GF_E_DOUBLEL: s = "Can only specify -r DOUBLE -r LAZY with w = 8"; break;
|
||||
case GF_E_QUAD__T: s = "Can only specify -r QUAD with -m TABLE."; break;
|
||||
case GF_E_QUAD__W: s = "Can only specify -r QUAD w = 4."; break;
|
||||
case GF_E_QUAD__J: s = "Cannot specify -r QUAD with -r ALTMAP|SSE|NOSSE."; break;
|
||||
case GF_E_QUAD__J: s = "Cannot specify -r QUAD with -r ALTMAP|SIMD|NOSIMD."; break;
|
||||
case GF_E_BADPOLY: s = "Bad primitive polynomial (high bits set)."; break;
|
||||
case GF_E_COMP_PP: s = "Bad primitive polynomial -- bigger than sub-field."; break;
|
||||
case GF_E_LAZY__X: s = "If -r LAZY, then -r must be DOUBLE or QUAD."; break;
|
||||
case GF_E_ALTSHIF: s = "Cannot specify -m SHIFT and -r ALTMAP."; break;
|
||||
case GF_E_SSESHIF: s = "Cannot specify -m SHIFT and -r SSE|NOSSE."; break;
|
||||
case GF_E_SSESHIF: s = "Cannot specify -m SHIFT and -r SIMD|NOSIMD."; break;
|
||||
case GF_E_ALT_CFM: s = "Cannot specify -m CARRY_FREE and -r ALTMAP."; break;
|
||||
case GF_E_SSE_CFM: s = "Cannot specify -m CARRY_FREE and -r SSE|NOSSE."; break;
|
||||
case GF_E_SSE_CFM: s = "Cannot specify -m CARRY_FREE and -r SIMD|NOSIMD."; break;
|
||||
case GF_E_PCLMULX: s = "Specified -m CARRY_FREE, but PCLMUL is not supported."; break;
|
||||
case GF_E_ALT_BY2: s = "Cannot specify -m BYTWO_x and -r ALTMAP."; break;
|
||||
case GF_E_BY2_SSE: s = "Specified -m BYTWO_x -r SSE, but SSE2 is not supported."; break;
|
||||
case GF_E_BY2_SSE: s = "Specified -m BYTWO_x -r SIMD, but SSE2 is not supported."; break;
|
||||
case GF_E_LOGBADW: s = "With Log Tables, w must be <= 27."; break;
|
||||
case GF_E_LOG___J: s = "Cannot use Log tables with -r ALTMAP|SSE|NOSSE."; break;
|
||||
case GF_E_LOG___J: s = "Cannot use Log tables with -r ALTMAP|SIMD|NOSIMD."; break;
|
||||
case GF_E_LOGPOLY: s = "Cannot use Log tables because the polynomial is not primitive."; break;
|
||||
case GF_E_ZERBADW: s = "With -m LOG_ZERO, w must be 8 or 16."; break;
|
||||
case GF_E_ZEXBADW: s = "With -m LOG_ZERO_EXT, w must be 8."; break;
|
||||
|
@ -77,33 +79,33 @@ void gf_error()
|
|||
case GF_E_GR_128A: s = "With -m GROUP, w == 128, arg1 must be 4, and arg2 in { 4,8,16 }."; break;
|
||||
case GF_E_GR_A_27: s = "With -m GROUP, arg1 and arg2 must be <= 27."; break;
|
||||
case GF_E_GR_AR_W: s = "With -m GROUP, arg1 and arg2 must be <= w."; break;
|
||||
case GF_E_GR____J: s = "Cannot use GROUP with -r ALTMAP|SSE|NOSSE."; break;
|
||||
case GF_E_GR____J: s = "Cannot use GROUP with -r ALTMAP|SIMD|NOSIMD."; break;
|
||||
case GF_E_TABLE_W: s = "With -m TABLE, w must be < 15, or == 16."; break;
|
||||
case GF_E_TAB_SSE: s = "With -m TABLE, SSE|NOSSE only applies to w=4."; break;
|
||||
case GF_E_TABSSE3: s = "With -m TABLE, -r SSE, you need SSSE3 supported."; break;
|
||||
case GF_E_TAB_SSE: s = "With -m TABLE, SIMD|NOSIMD only applies to w=4."; break;
|
||||
case GF_E_TABSSE3: s = "With -m TABLE, -r SIMD, you need SSSE3 supported."; break;
|
||||
case GF_E_TAB_ALT: s = "With -m TABLE, you cannot use ALTMAP."; break;
|
||||
case GF_E_SP128AR: s = "With -m SPLIT, w=128, bad arg1/arg2."; break;
|
||||
case GF_E_SP128AL: s = "With -m SPLIT, w=128, -r SSE requires -r ALTMAP."; break;
|
||||
case GF_E_SP128AL: s = "With -m SPLIT, w=128, -r SIMD requires -r ALTMAP."; break;
|
||||
case GF_E_SP128AS: s = "With -m SPLIT, w=128, ALTMAP needs SSSE3 supported."; break;
|
||||
case GF_E_SP128_A: s = "With -m SPLIT, w=128, -r ALTMAP only with arg1/arg2 = 4/128."; break;
|
||||
case GF_E_SP128_S: s = "With -m SPLIT, w=128, -r SSE|NOSSE only with arg1/arg2 = 4/128."; break;
|
||||
case GF_E_SP128_S: s = "With -m SPLIT, w=128, -r SIMD|NOSIMD only with arg1/arg2 = 4/128."; break;
|
||||
case GF_E_SPLIT_W: s = "With -m SPLIT, w must be in {8, 16, 32, 64, 128}."; break;
|
||||
case GF_E_SP_16AR: s = "With -m SPLIT, w=16, Bad arg1/arg2."; break;
|
||||
case GF_E_SP_16_A: s = "With -m SPLIT, w=16, -r ALTMAP only with arg1/arg2 = 4/16."; break;
|
||||
case GF_E_SP_16_S: s = "With -m SPLIT, w=16, -r SSE|NOSSE only with arg1/arg2 = 4/16."; break;
|
||||
case GF_E_SP_16_S: s = "With -m SPLIT, w=16, -r SIMD|NOSIMD only with arg1/arg2 = 4/16."; break;
|
||||
case GF_E_SP_32AR: s = "With -m SPLIT, w=32, Bad arg1/arg2."; break;
|
||||
case GF_E_SP_32AS: s = "With -m SPLIT, w=32, -r ALTMAP needs SSSE3 supported."; break;
|
||||
case GF_E_SP_32_A: s = "With -m SPLIT, w=32, -r ALTMAP only with arg1/arg2 = 4/32."; break;
|
||||
case GF_E_SP_32_S: s = "With -m SPLIT, w=32, -r SSE|NOSSE only with arg1/arg2 = 4/32."; break;
|
||||
case GF_E_SP_32_S: s = "With -m SPLIT, w=32, -r SIMD|NOSIMD only with arg1/arg2 = 4/32."; break;
|
||||
case GF_E_SP_64AR: s = "With -m SPLIT, w=64, Bad arg1/arg2."; break;
|
||||
case GF_E_SP_64AS: s = "With -m SPLIT, w=64, -r ALTMAP needs SSSE3 supported."; break;
|
||||
case GF_E_SP_64_A: s = "With -m SPLIT, w=64, -r ALTMAP only with arg1/arg2 = 4/64."; break;
|
||||
case GF_E_SP_64_S: s = "With -m SPLIT, w=64, -r SSE|NOSSE only with arg1/arg2 = 4/64."; break;
|
||||
case GF_E_SP_64_S: s = "With -m SPLIT, w=64, -r SIMD|NOSIMD only with arg1/arg2 = 4/64."; break;
|
||||
case GF_E_SP_8_AR: s = "With -m SPLIT, w=8, Bad arg1/arg2."; break;
|
||||
case GF_E_SP_8__A: s = "With -m SPLIT, w=8, Can't have -r ALTMAP."; break;
|
||||
case GF_E_SP_SSE3: s = "With -m SPLIT, Need SSSE3 support for SSE."; break;
|
||||
case GF_E_SP_SSE3: s = "With -m SPLIT, Need SSSE3 support for SIMD."; break;
|
||||
case GF_E_COMP_A2: s = "With -m COMPOSITE, arg1 must equal 2."; break;
|
||||
case GF_E_COMP_SS: s = "With -m COMPOSITE, -r SSE and -r NOSSE do not apply."; break;
|
||||
case GF_E_COMP_SS: s = "With -m COMPOSITE, -r SIMD and -r NOSIMD do not apply."; break;
|
||||
case GF_E_COMP__W: s = "With -m COMPOSITE, w must be 8, 16, 32, 64 or 128."; break;
|
||||
case GF_E_UNKFLAG: s = "Unknown method flag - should be -m, -d, -r or -p."; break;
|
||||
case GF_E_UNKNOWN: s = "Unknown multiplication type."; break;
|
||||
|
@ -118,7 +120,7 @@ void gf_error()
|
|||
uint64_t gf_composite_get_default_poly(gf_t *base)
|
||||
{
|
||||
gf_internal_t *h;
|
||||
int rv;
|
||||
uint64_t rv;
|
||||
|
||||
h = (gf_internal_t *) base->scratch;
|
||||
if (h->w == 4) {
|
||||
|
@ -182,14 +184,14 @@ int gf_error_check(int w, int mult_type, int region_type, int divide_type,
|
|||
int sse3 = 0;
|
||||
int sse2 = 0;
|
||||
int pclmul = 0;
|
||||
int rdouble, rquad, rlazy, rsse, rnosse, raltmap, rcauchy, tmp;
|
||||
int rdouble, rquad, rlazy, rsimd, rnosimd, raltmap, rcauchy, tmp;
|
||||
gf_internal_t *sub;
|
||||
|
||||
rdouble = (region_type & GF_REGION_DOUBLE_TABLE);
|
||||
rquad = (region_type & GF_REGION_QUAD_TABLE);
|
||||
rlazy = (region_type & GF_REGION_LAZY);
|
||||
rsse = (region_type & GF_REGION_SSE);
|
||||
rnosse = (region_type & GF_REGION_NOSSE);
|
||||
rsimd = (region_type & GF_REGION_SIMD);
|
||||
rnosimd = (region_type & GF_REGION_NOSIMD);
|
||||
raltmap = (region_type & GF_REGION_ALTMAP);
|
||||
rcauchy = (region_type & GF_REGION_CAUCHY);
|
||||
|
||||
|
@ -201,19 +203,33 @@ int gf_error_check(int w, int mult_type, int region_type, int divide_type,
|
|||
}
|
||||
|
||||
tmp = ( GF_REGION_DOUBLE_TABLE | GF_REGION_QUAD_TABLE | GF_REGION_LAZY |
|
||||
GF_REGION_SSE | GF_REGION_NOSSE | GF_REGION_ALTMAP | GF_REGION_CAUCHY );
|
||||
GF_REGION_SIMD | GF_REGION_NOSIMD | GF_REGION_ALTMAP |
|
||||
GF_REGION_CAUCHY );
|
||||
if (region_type & (~tmp)) { _gf_errno = GF_E_UNK_REG; return 0; }
|
||||
|
||||
#ifdef INTEL_SSE2
|
||||
sse2 = 1;
|
||||
if (gf_cpu_supports_intel_sse2) {
|
||||
sse2 = 1;
|
||||
}
|
||||
#endif
|
||||
|
||||
#ifdef INTEL_SSSE3
|
||||
sse3 = 1;
|
||||
if (gf_cpu_supports_intel_ssse3) {
|
||||
sse3 = 1;
|
||||
}
|
||||
#endif
|
||||
|
||||
#ifdef INTEL_SSE4_PCLMUL
|
||||
pclmul = 1;
|
||||
if (gf_cpu_supports_intel_pclmul) {
|
||||
pclmul = 1;
|
||||
}
|
||||
#endif
|
||||
|
||||
#ifdef ARM_NEON
|
||||
if (gf_cpu_supports_arm_neon) {
|
||||
pclmul = (w == 4 || w == 8);
|
||||
sse3 = 1;
|
||||
}
|
||||
#endif
|
||||
|
||||
|
||||
|
@ -230,7 +246,7 @@ int gf_error_check(int w, int mult_type, int region_type, int divide_type,
|
|||
return 1;
|
||||
}
|
||||
|
||||
if (rsse && rnosse) { _gf_errno = GF_E_SSE__NO; return 0; }
|
||||
if (rsimd && rnosimd) { _gf_errno = GF_E_SIMD_NO; return 0; }
|
||||
if (rcauchy && w > 32) { _gf_errno = GF_E_CAUGT32; return 0; }
|
||||
if (rcauchy && region_type != GF_REGION_CAUCHY) { _gf_errno = GF_E_CAUCHYB; return 0; }
|
||||
if (rcauchy && mult_type == GF_MULT_COMPOSITE) { _gf_errno = GF_E_CAUCOMP; return 0; }
|
||||
|
@ -252,7 +268,7 @@ int gf_error_check(int w, int mult_type, int region_type, int divide_type,
|
|||
if (rquad) { _gf_errno = GF_E_DOUQUAD; return 0; }
|
||||
if (mult_type != GF_MULT_TABLE) { _gf_errno = GF_E_DOUBLET; return 0; }
|
||||
if (w != 4 && w != 8) { _gf_errno = GF_E_DOUBLEW; return 0; }
|
||||
if (rsse || rnosse || raltmap) { _gf_errno = GF_E_DOUBLEJ; return 0; }
|
||||
if (rsimd || rnosimd || raltmap) { _gf_errno = GF_E_DOUBLEJ; return 0; }
|
||||
if (rlazy && w == 4) { _gf_errno = GF_E_DOUBLEL; return 0; }
|
||||
return 1;
|
||||
}
|
||||
|
@ -260,7 +276,7 @@ int gf_error_check(int w, int mult_type, int region_type, int divide_type,
|
|||
if (rquad) {
|
||||
if (mult_type != GF_MULT_TABLE) { _gf_errno = GF_E_QUAD__T; return 0; }
|
||||
if (w != 4) { _gf_errno = GF_E_QUAD__W; return 0; }
|
||||
if (rsse || rnosse || raltmap) { _gf_errno = GF_E_QUAD__J; return 0; }
|
||||
if (rsimd || rnosimd || raltmap) { _gf_errno = GF_E_QUAD__J; return 0; }
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -268,7 +284,7 @@ int gf_error_check(int w, int mult_type, int region_type, int divide_type,
|
|||
|
||||
if (mult_type == GF_MULT_SHIFT) {
|
||||
if (raltmap) { _gf_errno = GF_E_ALTSHIF; return 0; }
|
||||
if (rsse || rnosse) { _gf_errno = GF_E_SSESHIF; return 0; }
|
||||
if (rsimd || rnosimd) { _gf_errno = GF_E_SSESHIF; return 0; }
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -281,31 +297,30 @@ int gf_error_check(int w, int mult_type, int region_type, int divide_type,
|
|||
if (w == 32 && (poly & 0xfe000000)) { _gf_errno = GF_E_CF32POL; return 0; }
|
||||
if (w == 64 && (poly & 0xfffe000000000000ULL)) { _gf_errno = GF_E_CF64POL; return 0; }
|
||||
if (raltmap) { _gf_errno = GF_E_ALT_CFM; return 0; }
|
||||
if (rsse || rnosse) { _gf_errno = GF_E_SSE_CFM; return 0; }
|
||||
if (rsimd || rnosimd) { _gf_errno = GF_E_SSE_CFM; return 0; }
|
||||
if (!pclmul) { _gf_errno = GF_E_PCLMULX; return 0; }
|
||||
return 1;
|
||||
}
|
||||
|
||||
//ADAM
|
||||
if (mult_type == GF_MULT_CARRY_FREE_GK) {
|
||||
if (w != 4 && w != 8 && w != 16 &&
|
||||
w != 32 && w != 64 && w != 128) { _gf_errno = GF_E_CFM___W; return 0; }
|
||||
if (raltmap) { _gf_errno = GF_E_ALT_CFM; return 0; }
|
||||
if (rsse || rnosse) { _gf_errno = GF_E_SSE_CFM; return 0; }
|
||||
if (rsimd || rnosimd) { _gf_errno = GF_E_SSE_CFM; return 0; }
|
||||
if (!pclmul) { _gf_errno = GF_E_PCLMULX; return 0; }
|
||||
return 1;
|
||||
}
|
||||
|
||||
if (mult_type == GF_MULT_BYTWO_p || mult_type == GF_MULT_BYTWO_b) {
|
||||
if (raltmap) { _gf_errno = GF_E_ALT_BY2; return 0; }
|
||||
if (rsse && !sse2) { _gf_errno = GF_E_BY2_SSE; return 0; }
|
||||
if (rsimd && !sse2) { _gf_errno = GF_E_BY2_SSE; return 0; }
|
||||
return 1;
|
||||
}
|
||||
|
||||
if (mult_type == GF_MULT_LOG_TABLE || mult_type == GF_MULT_LOG_ZERO
|
||||
|| mult_type == GF_MULT_LOG_ZERO_EXT ) {
|
||||
if (w > 27) { _gf_errno = GF_E_LOGBADW; return 0; }
|
||||
if (raltmap || rsse || rnosse) { _gf_errno = GF_E_LOG___J; return 0; }
|
||||
if (raltmap || rsimd || rnosimd) { _gf_errno = GF_E_LOG___J; return 0; }
|
||||
|
||||
if (mult_type == GF_MULT_LOG_TABLE) return 1;
|
||||
|
||||
|
@ -325,14 +340,14 @@ int gf_error_check(int w, int mult_type, int region_type, int divide_type,
|
|||
(arg2 != 4 && arg2 != 8 && arg2 != 16))) { _gf_errno = GF_E_GR_128A; return 0; }
|
||||
if (arg1 > 27 || arg2 > 27) { _gf_errno = GF_E_GR_A_27; return 0; }
|
||||
if (arg1 > w || arg2 > w) { _gf_errno = GF_E_GR_AR_W; return 0; }
|
||||
if (raltmap || rsse || rnosse) { _gf_errno = GF_E_GR____J; return 0; }
|
||||
if (raltmap || rsimd || rnosimd) { _gf_errno = GF_E_GR____J; return 0; }
|
||||
return 1;
|
||||
}
|
||||
|
||||
if (mult_type == GF_MULT_TABLE) {
|
||||
if (w != 16 && w >= 15) { _gf_errno = GF_E_TABLE_W; return 0; }
|
||||
if (w != 4 && (rsse || rnosse)) { _gf_errno = GF_E_TAB_SSE; return 0; }
|
||||
if (rsse && !sse3) { _gf_errno = GF_E_TABSSE3; return 0; }
|
||||
if (w != 4 && (rsimd || rnosimd)) { _gf_errno = GF_E_TAB_SSE; return 0; }
|
||||
if (rsimd && !sse3) { _gf_errno = GF_E_TABSSE3; return 0; }
|
||||
if (raltmap) { _gf_errno = GF_E_TAB_ALT; return 0; }
|
||||
return 1;
|
||||
}
|
||||
|
@ -345,46 +360,46 @@ int gf_error_check(int w, int mult_type, int region_type, int divide_type,
|
|||
}
|
||||
if (w == 8) {
|
||||
if (arg1 != 4 || arg2 != 8) { _gf_errno = GF_E_SP_8_AR; return 0; }
|
||||
if (rsse && !sse3) { _gf_errno = GF_E_SP_SSE3; return 0; }
|
||||
if (rsimd && !sse3) { _gf_errno = GF_E_SP_SSE3; return 0; }
|
||||
if (raltmap) { _gf_errno = GF_E_SP_8__A; return 0; }
|
||||
} else if (w == 16) {
|
||||
if ((arg1 == 8 && arg2 == 8) ||
|
||||
(arg1 == 8 && arg2 == 16)) {
|
||||
if (rsse || rnosse) { _gf_errno = GF_E_SP_16_S; return 0; }
|
||||
if (rsimd || rnosimd) { _gf_errno = GF_E_SP_16_S; return 0; }
|
||||
if (raltmap) { _gf_errno = GF_E_SP_16_A; return 0; }
|
||||
} else if (arg1 == 4 && arg2 == 16) {
|
||||
if (rsse && !sse3) { _gf_errno = GF_E_SP_SSE3; return 0; }
|
||||
if (rsimd && !sse3) { _gf_errno = GF_E_SP_SSE3; return 0; }
|
||||
} else { _gf_errno = GF_E_SP_16AR; return 0; }
|
||||
} else if (w == 32) {
|
||||
if ((arg1 == 8 && arg2 == 8) ||
|
||||
(arg1 == 8 && arg2 == 32) ||
|
||||
(arg1 == 16 && arg2 == 32)) {
|
||||
if (rsse || rnosse) { _gf_errno = GF_E_SP_32_S; return 0; }
|
||||
if (rsimd || rnosimd) { _gf_errno = GF_E_SP_32_S; return 0; }
|
||||
if (raltmap) { _gf_errno = GF_E_SP_32_A; return 0; }
|
||||
} else if (arg1 == 4 && arg2 == 32) {
|
||||
if (rsse && !sse3) { _gf_errno = GF_E_SP_SSE3; return 0; }
|
||||
if (rsimd && !sse3) { _gf_errno = GF_E_SP_SSE3; return 0; }
|
||||
if (raltmap && !sse3) { _gf_errno = GF_E_SP_32AS; return 0; }
|
||||
if (raltmap && rnosse) { _gf_errno = GF_E_SP_32AS; return 0; }
|
||||
if (raltmap && rnosimd) { _gf_errno = GF_E_SP_32AS; return 0; }
|
||||
} else { _gf_errno = GF_E_SP_32AR; return 0; }
|
||||
} else if (w == 64) {
|
||||
if ((arg1 == 8 && arg2 == 8) ||
|
||||
(arg1 == 8 && arg2 == 64) ||
|
||||
(arg1 == 16 && arg2 == 64)) {
|
||||
if (rsse || rnosse) { _gf_errno = GF_E_SP_64_S; return 0; }
|
||||
if (rsimd || rnosimd) { _gf_errno = GF_E_SP_64_S; return 0; }
|
||||
if (raltmap) { _gf_errno = GF_E_SP_64_A; return 0; }
|
||||
} else if (arg1 == 4 && arg2 == 64) {
|
||||
if (rsse && !sse3) { _gf_errno = GF_E_SP_SSE3; return 0; }
|
||||
if (rsimd && !sse3) { _gf_errno = GF_E_SP_SSE3; return 0; }
|
||||
if (raltmap && !sse3) { _gf_errno = GF_E_SP_64AS; return 0; }
|
||||
if (raltmap && rnosse) { _gf_errno = GF_E_SP_64AS; return 0; }
|
||||
if (raltmap && rnosimd) { _gf_errno = GF_E_SP_64AS; return 0; }
|
||||
} else { _gf_errno = GF_E_SP_64AR; return 0; }
|
||||
} else if (w == 128) {
|
||||
if (arg1 == 8 && arg2 == 128) {
|
||||
if (rsse || rnosse) { _gf_errno = GF_E_SP128_S; return 0; }
|
||||
if (rsimd || rnosimd) { _gf_errno = GF_E_SP128_S; return 0; }
|
||||
if (raltmap) { _gf_errno = GF_E_SP128_A; return 0; }
|
||||
} else if (arg1 == 4 && arg2 == 128) {
|
||||
if (rsse && !sse3) { _gf_errno = GF_E_SP_SSE3; return 0; }
|
||||
if (rsimd && !sse3) { _gf_errno = GF_E_SP_SSE3; return 0; }
|
||||
if (raltmap && !sse3) { _gf_errno = GF_E_SP128AS; return 0; }
|
||||
if (raltmap && rnosse) { _gf_errno = GF_E_SP128AS; return 0; }
|
||||
if (raltmap && rnosimd) { _gf_errno = GF_E_SP128AS; return 0; }
|
||||
} else { _gf_errno = GF_E_SP128AR; return 0; }
|
||||
} else { _gf_errno = GF_E_SPLIT_W; return 0; }
|
||||
return 1;
|
||||
|
@ -393,10 +408,10 @@ int gf_error_check(int w, int mult_type, int region_type, int divide_type,
|
|||
if (mult_type == GF_MULT_COMPOSITE) {
|
||||
if (w != 8 && w != 16 && w != 32
|
||||
&& w != 64 && w != 128) { _gf_errno = GF_E_COMP__W; return 0; }
|
||||
if ((poly >> (w/2)) != 0) { _gf_errno = GF_E_COMP_PP; return 0; }
|
||||
if (w < 128 && (poly >> (w/2)) != 0) { _gf_errno = GF_E_COMP_PP; return 0; }
|
||||
if (divide_type != GF_DIVIDE_DEFAULT) { _gf_errno = GF_E_DIVCOMP; return 0; }
|
||||
if (arg1 != 2) { _gf_errno = GF_E_COMP_A2; return 0; }
|
||||
if (rsse || rnosse) { _gf_errno = GF_E_COMP_SS; return 0; }
|
||||
if (rsimd || rnosimd) { _gf_errno = GF_E_COMP_SS; return 0; }
|
||||
if (base != NULL) {
|
||||
sub = (gf_internal_t *) base->scratch;
|
||||
if (sub->w != w/2) { _gf_errno = GF_E_BASE__W; return 0; }
|
||||
|
@ -467,6 +482,8 @@ int gf_init_hard(gf_t *gf, int w, int mult_type,
|
|||
int sz;
|
||||
gf_internal_t *h;
|
||||
|
||||
gf_cpu_identify();
|
||||
|
||||
if (gf_error_check(w, mult_type, region_type, divide_type,
|
||||
arg1, arg2, prim_poly, base_gf) == 0) return 0;
|
||||
|
||||
|
@ -523,7 +540,7 @@ void gf_alignment_error(char *s, int a)
|
|||
fprintf(stderr, "Alignment error in %s:\n", s);
|
||||
fprintf(stderr, " The source and destination buffers must be aligned to each other,\n");
|
||||
fprintf(stderr, " and they must be aligned to a %d-byte address.\n", a);
|
||||
exit(1);
|
||||
assert(0);
|
||||
}
|
||||
|
||||
static
|
||||
|
@ -546,7 +563,7 @@ void gf_invert_binary_matrix(uint32_t *mat, uint32_t *inv, int rows) {
|
|||
for (j = i+1; j < rows && (mat[j] & (1 << i)) == 0; j++) ;
|
||||
if (j == rows) {
|
||||
fprintf(stderr, "galois_invert_matrix: Matrix not invertible!!\n");
|
||||
exit(1);
|
||||
assert(0);
|
||||
}
|
||||
tmp = mat[i]; mat[i] = mat[j]; mat[j] = tmp;
|
||||
tmp = inv[i]; inv[i] = inv[j]; inv[j] = tmp;
|
||||
|
@ -578,7 +595,7 @@ uint32_t gf_bitmatrix_inverse(uint32_t y, int w, uint32_t pp)
|
|||
uint32_t mat[32], inv[32], mask;
|
||||
int i;
|
||||
|
||||
mask = (w == 32) ? 0xffffffff : (1 << w) - 1;
|
||||
mask = (w == 32) ? 0xffffffff : ((uint32_t)1 << w) - 1;
|
||||
for (i = 0; i < w; i++) {
|
||||
mat[i] = y;
|
||||
|
||||
|
@ -807,7 +824,7 @@ void gf_set_region_data(gf_region_data *rd,
|
|||
if (h != NULL && bytes % h->w != 0) {
|
||||
fprintf(stderr, "Error in region multiply operation.\n");
|
||||
fprintf(stderr, "The size must be a multiple of %d bytes.\n", h->w);
|
||||
exit(1);
|
||||
assert(0);
|
||||
}
|
||||
|
||||
rd->s_start = src;
|
||||
|
@ -823,7 +840,7 @@ void gf_set_region_data(gf_region_data *rd,
|
|||
fprintf(stderr, "to each other along a %d byte boundary.\n", a);
|
||||
fprintf(stderr, "Src = 0x%lx. Dest = 0x%lx\n", (unsigned long) src,
|
||||
(unsigned long) dest);
|
||||
exit(1);
|
||||
assert(0);
|
||||
}
|
||||
|
||||
if (uls % wb != 0) {
|
||||
|
@ -831,13 +848,13 @@ void gf_set_region_data(gf_region_data *rd,
|
|||
fprintf(stderr, "The pointers must be aligned along a %d byte boundary.\n", wb);
|
||||
fprintf(stderr, "Src = 0x%lx. Dest = 0x%lx\n", (unsigned long) src,
|
||||
(unsigned long) dest);
|
||||
exit(1);
|
||||
assert(0);
|
||||
}
|
||||
|
||||
if (bytes % wb != 0) {
|
||||
fprintf(stderr, "Error in region multiply operation.\n");
|
||||
fprintf(stderr, "The size must be a multiple of %d bytes.\n", wb);
|
||||
exit(1);
|
||||
assert(0);
|
||||
}
|
||||
|
||||
uls %= a;
|
||||
|
@ -895,66 +912,104 @@ static void gf_unaligned_xor(void *src, void *dest, int bytes);
|
|||
|
||||
void gf_multby_one(void *src, void *dest, int bytes, int xor)
|
||||
{
|
||||
#ifdef INTEL_SSE2
|
||||
__m128i ms, md;
|
||||
#endif
|
||||
unsigned long uls, uld;
|
||||
uint8_t *s8, *d8;
|
||||
uint64_t *s64, *d64, *dtop64;
|
||||
gf_region_data rd;
|
||||
|
||||
if (!xor) {
|
||||
memcpy(dest, src, bytes);
|
||||
if (dest != src)
|
||||
memcpy(dest, src, bytes);
|
||||
return;
|
||||
}
|
||||
uls = (unsigned long) src;
|
||||
uld = (unsigned long) dest;
|
||||
|
||||
#ifdef INTEL_SSE2
|
||||
int abytes;
|
||||
s8 = (uint8_t *) src;
|
||||
d8 = (uint8_t *) dest;
|
||||
if (uls % 16 == uld % 16) {
|
||||
gf_set_region_data(&rd, NULL, src, dest, bytes, 1, xor, 16);
|
||||
while (s8 != rd.s_start) {
|
||||
*d8 ^= *s8;
|
||||
d8++;
|
||||
s8++;
|
||||
if (gf_cpu_supports_intel_sse2) {
|
||||
__m128i ms, md;
|
||||
int abytes;
|
||||
s8 = (uint8_t *) src;
|
||||
d8 = (uint8_t *) dest;
|
||||
if (uls % 16 == uld % 16) {
|
||||
gf_set_region_data(&rd, NULL, src, dest, bytes, 1, xor, 16);
|
||||
while (s8 != rd.s_start) {
|
||||
*d8 ^= *s8;
|
||||
d8++;
|
||||
s8++;
|
||||
}
|
||||
while (s8 < (uint8_t *) rd.s_top) {
|
||||
ms = _mm_load_si128 ((__m128i *)(s8));
|
||||
md = _mm_load_si128 ((__m128i *)(d8));
|
||||
md = _mm_xor_si128(md, ms);
|
||||
_mm_store_si128((__m128i *)(d8), md);
|
||||
s8 += 16;
|
||||
d8 += 16;
|
||||
}
|
||||
while (s8 != (uint8_t *) src + bytes) {
|
||||
*d8 ^= *s8;
|
||||
d8++;
|
||||
s8++;
|
||||
}
|
||||
return;
|
||||
}
|
||||
while (s8 < (uint8_t *) rd.s_top) {
|
||||
ms = _mm_load_si128 ((__m128i *)(s8));
|
||||
md = _mm_load_si128 ((__m128i *)(d8));
|
||||
|
||||
abytes = (bytes & 0xfffffff0);
|
||||
|
||||
while (d8 < (uint8_t *) dest + abytes) {
|
||||
ms = _mm_loadu_si128 ((__m128i *)(s8));
|
||||
md = _mm_loadu_si128 ((__m128i *)(d8));
|
||||
md = _mm_xor_si128(md, ms);
|
||||
_mm_store_si128((__m128i *)(d8), md);
|
||||
_mm_storeu_si128((__m128i *)(d8), md);
|
||||
s8 += 16;
|
||||
d8 += 16;
|
||||
}
|
||||
while (s8 != (uint8_t *) src + bytes) {
|
||||
while (d8 != (uint8_t *) dest+bytes) {
|
||||
*d8 ^= *s8;
|
||||
d8++;
|
||||
s8++;
|
||||
}
|
||||
return;
|
||||
}
|
||||
|
||||
abytes = (bytes & 0xfffffff0);
|
||||
|
||||
while (d8 < (uint8_t *) dest + abytes) {
|
||||
ms = _mm_loadu_si128 ((__m128i *)(s8));
|
||||
md = _mm_loadu_si128 ((__m128i *)(d8));
|
||||
md = _mm_xor_si128(md, ms);
|
||||
_mm_storeu_si128((__m128i *)(d8), md);
|
||||
s8 += 16;
|
||||
d8 += 16;
|
||||
}
|
||||
while (d8 != (uint8_t *) dest+bytes) {
|
||||
*d8 ^= *s8;
|
||||
d8++;
|
||||
s8++;
|
||||
}
|
||||
return;
|
||||
#endif
|
||||
#if defined(ARM_NEON)
|
||||
if (gf_cpu_supports_arm_neon) {
|
||||
s8 = (uint8_t *) src;
|
||||
d8 = (uint8_t *) dest;
|
||||
|
||||
if (uls % 16 == uld % 16) {
|
||||
gf_set_region_data(&rd, NULL, src, dest, bytes, 1, xor, 16);
|
||||
while (s8 != rd.s_start) {
|
||||
*d8 ^= *s8;
|
||||
s8++;
|
||||
d8++;
|
||||
}
|
||||
while (s8 < (uint8_t *) rd.s_top) {
|
||||
uint8x16_t vs = vld1q_u8 (s8);
|
||||
uint8x16_t vd = vld1q_u8 (d8);
|
||||
uint8x16_t vr = veorq_u8 (vs, vd);
|
||||
vst1q_u8 (d8, vr);
|
||||
s8 += 16;
|
||||
d8 += 16;
|
||||
}
|
||||
} else {
|
||||
while (s8 + 15 < (uint8_t *) src + bytes) {
|
||||
uint8x16_t vs = vld1q_u8 (s8);
|
||||
uint8x16_t vd = vld1q_u8 (d8);
|
||||
uint8x16_t vr = veorq_u8 (vs, vd);
|
||||
vst1q_u8 (d8, vr);
|
||||
s8 += 16;
|
||||
d8 += 16;
|
||||
}
|
||||
}
|
||||
while (s8 < (uint8_t *) src + bytes) {
|
||||
*d8 ^= *s8;
|
||||
s8++;
|
||||
d8++;
|
||||
}
|
||||
return;
|
||||
}
|
||||
#endif
|
||||
if (uls % 8 != uld % 8) {
|
||||
gf_unaligned_xor(src, dest, bytes);
|
||||
return;
|
||||
|
|
|
@ -0,0 +1,180 @@
|
|||
/*
|
||||
* GF-Complete: A Comprehensive Open Source Library for Galois Field Arithmetic
|
||||
* James S. Plank, Ethan L. Miller, Kevin M. Greenan,
|
||||
* Benjamin A. Arnold, John A. Burnum, Adam W. Disney, Allen C. McBride.
|
||||
*
|
||||
* gf_cpu.h
|
||||
*
|
||||
* Identifies whether the CPU supports SIMD instructions at runtime.
|
||||
*/
|
||||
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
|
||||
int gf_cpu_identified = 0;
|
||||
|
||||
int gf_cpu_supports_intel_pclmul = 0;
|
||||
int gf_cpu_supports_intel_sse4 = 0;
|
||||
int gf_cpu_supports_intel_ssse3 = 0;
|
||||
int gf_cpu_supports_intel_sse3 = 0;
|
||||
int gf_cpu_supports_intel_sse2 = 0;
|
||||
int gf_cpu_supports_arm_neon = 0;
|
||||
|
||||
#if defined(__x86_64__)
|
||||
|
||||
/* CPUID Feature Bits */
|
||||
|
||||
/* ECX */
|
||||
#define GF_CPU_SSE3 (1 << 0)
|
||||
#define GF_CPU_PCLMUL (1 << 1)
|
||||
#define GF_CPU_SSSE3 (1 << 9)
|
||||
#define GF_CPU_SSE41 (1 << 19)
|
||||
#define GF_CPU_SSE42 (1 << 20)
|
||||
|
||||
/* EDX */
|
||||
#define GF_CPU_SSE2 (1 << 26)
|
||||
|
||||
#if defined(_MSC_VER)
|
||||
|
||||
#define cpuid(info, x) __cpuidex(info, x, 0)
|
||||
|
||||
#elif defined(__GNUC__)
|
||||
|
||||
#include <cpuid.h>
|
||||
void cpuid(int info[4], int InfoType){
|
||||
__cpuid_count(InfoType, 0, info[0], info[1], info[2], info[3]);
|
||||
}
|
||||
|
||||
#else
|
||||
|
||||
#error please add a way to detect CPU SIMD support at runtime
|
||||
|
||||
#endif
|
||||
|
||||
void gf_cpu_identify(void)
|
||||
{
|
||||
if (gf_cpu_identified) {
|
||||
return;
|
||||
}
|
||||
|
||||
int reg[4];
|
||||
|
||||
cpuid(reg, 1);
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
if ((reg[2] & GF_CPU_PCLMUL) != 0 && !getenv("GF_COMPLETE_DISABLE_SSE4_PCLMUL")) {
|
||||
gf_cpu_supports_intel_pclmul = 1;
|
||||
#ifdef DEBUG_CPU_DETECTION
|
||||
printf("#gf_cpu_supports_intel_pclmul\n");
|
||||
#endif
|
||||
}
|
||||
#endif
|
||||
|
||||
#if defined(INTEL_SSE4)
|
||||
if (((reg[2] & GF_CPU_SSE42) != 0 || (reg[2] & GF_CPU_SSE41) != 0) && !getenv("GF_COMPLETE_DISABLE_SSE4")) {
|
||||
gf_cpu_supports_intel_sse4 = 1;
|
||||
#ifdef DEBUG_CPU_DETECTION
|
||||
printf("#gf_cpu_supports_intel_sse4\n");
|
||||
#endif
|
||||
}
|
||||
#endif
|
||||
|
||||
#if defined(INTEL_SSSE3)
|
||||
if ((reg[2] & GF_CPU_SSSE3) != 0 && !getenv("GF_COMPLETE_DISABLE_SSSE3")) {
|
||||
gf_cpu_supports_intel_ssse3 = 1;
|
||||
#ifdef DEBUG_CPU_DETECTION
|
||||
printf("#gf_cpu_supports_intel_ssse3\n");
|
||||
#endif
|
||||
}
|
||||
#endif
|
||||
|
||||
#if defined(INTEL_SSE3)
|
||||
if ((reg[2] & GF_CPU_SSE3) != 0 && !getenv("GF_COMPLETE_DISABLE_SSE3")) {
|
||||
gf_cpu_supports_intel_sse3 = 1;
|
||||
#ifdef DEBUG_CPU_DETECTION
|
||||
printf("#gf_cpu_supports_intel_sse3\n");
|
||||
#endif
|
||||
}
|
||||
#endif
|
||||
|
||||
#if defined(INTEL_SSE2)
|
||||
if ((reg[3] & GF_CPU_SSE2) != 0 && !getenv("GF_COMPLETE_DISABLE_SSE2")) {
|
||||
gf_cpu_supports_intel_sse2 = 1;
|
||||
#ifdef DEBUG_CPU_DETECTION
|
||||
printf("#gf_cpu_supports_intel_sse2\n");
|
||||
#endif
|
||||
}
|
||||
#endif
|
||||
|
||||
gf_cpu_identified = 1;
|
||||
}
|
||||
|
||||
#elif defined(__arm__) || defined(__aarch64__)
|
||||
|
||||
#ifdef __linux__
|
||||
|
||||
#include <stdio.h>
|
||||
#include <unistd.h>
|
||||
#include <elf.h>
|
||||
#include <linux/auxvec.h>
|
||||
#include <asm/hwcap.h>
|
||||
#include <fcntl.h>
|
||||
|
||||
unsigned long get_hwcap(unsigned long type) {
|
||||
unsigned long hwcap = 0;
|
||||
int fd = open("/proc/self/auxv", O_RDONLY);
|
||||
if (fd > 0) {
|
||||
Elf32_auxv_t auxv;
|
||||
while (read(fd, &auxv, sizeof(Elf32_auxv_t))) {
|
||||
if (auxv.a_type == type) {
|
||||
hwcap = auxv.a_un.a_val;
|
||||
break;
|
||||
}
|
||||
}
|
||||
close(fd);
|
||||
}
|
||||
|
||||
return hwcap;
|
||||
}
|
||||
|
||||
#endif // linux
|
||||
|
||||
void gf_cpu_identify(void)
|
||||
{
|
||||
if (gf_cpu_identified) {
|
||||
return;
|
||||
}
|
||||
|
||||
#if defined(ARM_NEON)
|
||||
if (!getenv("GF_COMPLETE_DISABLE_NEON")) {
|
||||
#if __linux__ && __arm__
|
||||
gf_cpu_supports_arm_neon = (get_hwcap(AT_HWCAP) & HWCAP_NEON) > 0;
|
||||
#elif __aarch64__
|
||||
// ASIMD is supported on all aarch64 architectures
|
||||
gf_cpu_supports_arm_neon = 1;
|
||||
#else
|
||||
// we assume that NEON is supported if the compiler supports
|
||||
// NEON and we dont have a reliable way to detect runtime support.
|
||||
gf_cpu_supports_arm_neon = 1;
|
||||
#endif
|
||||
|
||||
#ifdef DEBUG_CPU_DETECTION
|
||||
if (gf_cpu_supports_arm_neon) {
|
||||
printf("#gf_cpu_supports_arm_neon\n");
|
||||
}
|
||||
#endif
|
||||
}
|
||||
#endif // defined(ARM_NEON)
|
||||
|
||||
gf_cpu_identified = 1;
|
||||
}
|
||||
|
||||
#else // defined(__arm__) || defined(__aarch64__)
|
||||
|
||||
int gf_cpu_identify(void)
|
||||
{
|
||||
gf_cpu_identified = 1;
|
||||
return 0;
|
||||
}
|
||||
|
||||
#endif
|
|
@ -17,6 +17,7 @@
|
|||
#include <string.h>
|
||||
#include <stdlib.h>
|
||||
#include <time.h>
|
||||
#include <assert.h>
|
||||
|
||||
#include "gf_complete.h"
|
||||
#include "gf_int.h"
|
||||
|
@ -136,7 +137,7 @@ int gf_general_s_to_val(gf_general_t *v, int w, char *s, int hex)
|
|||
}
|
||||
if (w == 32) return 1;
|
||||
if (w == 31) {
|
||||
if (v->w32 & (1 << 31)) return 0;
|
||||
if (v->w32 & ((gf_val_32_t)1 << 31)) return 0;
|
||||
return 1;
|
||||
}
|
||||
if (v->w32 & ~((1 << w)-1)) return 0;
|
||||
|
@ -311,7 +312,7 @@ void gf_general_do_region_check(gf_t *gf, gf_general_t *a, void *orig_a, void *o
|
|||
if (xor) fprintf(stderr," XOR with target word: %s\n", sot);
|
||||
fprintf(stderr," Product word: %s\n", sft);
|
||||
fprintf(stderr," It should be: %s\n", ssb);
|
||||
exit(0);
|
||||
assert(0);
|
||||
}
|
||||
}
|
||||
}
|
||||
|
|
|
@ -47,7 +47,6 @@ int create_gf_from_argv(gf_t *gf, int w, int argc, char **argv, int starting)
|
|||
} else if (strcmp(argv[starting], "CARRY_FREE") == 0) {
|
||||
mult_type = GF_MULT_CARRY_FREE;
|
||||
starting++;
|
||||
//ADAM
|
||||
} else if (strcmp(argv[starting], "CARRY_FREE_GK") == 0) {
|
||||
mult_type = GF_MULT_CARRY_FREE_GK;
|
||||
starting++;
|
||||
|
@ -108,7 +107,6 @@ int create_gf_from_argv(gf_t *gf, int w, int argc, char **argv, int starting)
|
|||
return 0;
|
||||
}
|
||||
} else {
|
||||
if (base != NULL) gf_free(base, 1);
|
||||
_gf_errno = GF_E_UNKNOWN;
|
||||
return 0;
|
||||
}
|
||||
|
@ -123,11 +121,17 @@ int create_gf_from_argv(gf_t *gf, int w, int argc, char **argv, int starting)
|
|||
} else if (strcmp(argv[starting], "LAZY") == 0) {
|
||||
region_type |= GF_REGION_LAZY;
|
||||
starting++;
|
||||
} else if (strcmp(argv[starting], "SIMD") == 0) {
|
||||
region_type |= GF_REGION_SIMD;
|
||||
starting++;
|
||||
} else if (strcmp(argv[starting], "NOSIMD") == 0) {
|
||||
region_type |= GF_REGION_NOSIMD;
|
||||
starting++;
|
||||
} else if (strcmp(argv[starting], "SSE") == 0) {
|
||||
region_type |= GF_REGION_SSE;
|
||||
region_type |= GF_REGION_SIMD;
|
||||
starting++;
|
||||
} else if (strcmp(argv[starting], "NOSSE") == 0) {
|
||||
region_type |= GF_REGION_NOSSE;
|
||||
region_type |= GF_REGION_NOSIMD;
|
||||
starting++;
|
||||
} else if (strcmp(argv[starting], "CAUCHY") == 0) {
|
||||
region_type |= GF_REGION_CAUCHY;
|
||||
|
|
128
src/gf_w128.c
|
@ -11,6 +11,7 @@
|
|||
#include "gf_int.h"
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
#include "gf_cpu.h"
|
||||
|
||||
#define GF_FIELD_WIDTH (128)
|
||||
|
||||
|
@ -49,7 +50,7 @@ void
|
|||
gf_w128_multiply_region_from_single(gf_t *gf, void *src, void *dest, gf_val_128_t val, int bytes,
|
||||
int xor)
|
||||
{
|
||||
int i;
|
||||
uint32_t i;
|
||||
gf_val_128_t s128;
|
||||
gf_val_128_t d128;
|
||||
uint64_t c128[2];
|
||||
|
@ -87,7 +88,7 @@ void
|
|||
gf_w128_clm_multiply_region_from_single(gf_t *gf, void *src, void *dest, gf_val_128_t val, int bytes,
|
||||
int xor)
|
||||
{
|
||||
int i;
|
||||
uint32_t i;
|
||||
gf_val_128_t s128;
|
||||
gf_val_128_t d128;
|
||||
gf_region_data rd;
|
||||
|
@ -290,11 +291,11 @@ gf_w128_shift_multiply(gf_t *gf, gf_val_128_t a128, gf_val_128_t b128, gf_val_12
|
|||
return;
|
||||
}
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
|
||||
void
|
||||
gf_w128_clm_multiply(gf_t *gf, gf_val_128_t a128, gf_val_128_t b128, gf_val_128_t c128)
|
||||
{
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
|
||||
__m128i a,b;
|
||||
__m128i result0,result1;
|
||||
__m128i prim_poly;
|
||||
|
@ -338,9 +339,8 @@ gf_w128_clm_multiply(gf_t *gf, gf_val_128_t a128, gf_val_128_t b128, gf_val_128_
|
|||
|
||||
c128[0] = (uint64_t)_mm_extract_epi64(result1,1);
|
||||
c128[1] = (uint64_t)_mm_extract_epi64(result1,0);
|
||||
#endif
|
||||
return;
|
||||
}
|
||||
#endif
|
||||
|
||||
void
|
||||
gf_w128_bytwo_p_multiply(gf_t *gf, gf_val_128_t a128, gf_val_128_t b128, gf_val_128_t c128)
|
||||
|
@ -376,10 +376,10 @@ gf_w128_bytwo_p_multiply(gf_t *gf, gf_val_128_t a128, gf_val_128_t b128, gf_val_
|
|||
return;
|
||||
}
|
||||
|
||||
#if defined(INTEL_SSE4)
|
||||
void
|
||||
gf_w128_sse_bytwo_p_multiply(gf_t *gf, gf_val_128_t a128, gf_val_128_t b128, gf_val_128_t c128)
|
||||
{
|
||||
#if defined(INTEL_SSE4)
|
||||
int i;
|
||||
__m128i a, b, pp, prod, amask, u_middle_one;
|
||||
/*John: pmask is always the highest bit set, and the rest zeros. amask changes, it's a countdown.*/
|
||||
|
@ -413,7 +413,7 @@ gf_w128_sse_bytwo_p_multiply(gf_t *gf, gf_val_128_t a128, gf_val_128_t b128, gf_
|
|||
}
|
||||
amask = _mm_srli_epi64(amask, 1); /*so does this one, but we can just replace after loop*/
|
||||
}
|
||||
amask = _mm_insert_epi32(amask, 1 << 31, 0x1);
|
||||
amask = _mm_insert_epi32(amask, (gf_val_32_t)1 << 31, 0x1);
|
||||
for (i = 64; i < 128; i++) {
|
||||
topbit = (_mm_extract_epi32(prod, 0x3) & pmask);
|
||||
middlebit = (_mm_extract_epi32(prod, 0x1) & pmask);
|
||||
|
@ -427,16 +427,16 @@ gf_w128_sse_bytwo_p_multiply(gf_t *gf, gf_val_128_t a128, gf_val_128_t b128, gf_
|
|||
}
|
||||
c128[0] = (uint64_t)_mm_extract_epi64(prod, 1);
|
||||
c128[1] = (uint64_t)_mm_extract_epi64(prod, 0);
|
||||
#endif
|
||||
return;
|
||||
}
|
||||
#endif
|
||||
|
||||
|
||||
/* Ben: This slow function implements sse instrutions for bytwo_b because why not */
|
||||
#if defined(INTEL_SSE4)
|
||||
void
|
||||
gf_w128_sse_bytwo_b_multiply(gf_t *gf, gf_val_128_t a128, gf_val_128_t b128, gf_val_128_t c128)
|
||||
{
|
||||
#if defined(INTEL_SSE4)
|
||||
__m128i a, b, lmask, hmask, pp, c, middle_one;
|
||||
gf_internal_t *h;
|
||||
uint64_t topbit, middlebit;
|
||||
|
@ -471,8 +471,8 @@ gf_w128_sse_bytwo_b_multiply(gf_t *gf, gf_val_128_t a128, gf_val_128_t b128, gf_
|
|||
if (middlebit) b = _mm_xor_si128(b, middle_one);
|
||||
if (topbit) b = _mm_xor_si128(b, pp);
|
||||
}
|
||||
#endif
|
||||
}
|
||||
#endif
|
||||
|
||||
void
|
||||
gf_w128_bytwo_b_multiply(gf_t *gf, gf_val_128_t a128, gf_val_128_t b128, gf_val_128_t c128)
|
||||
|
@ -568,7 +568,6 @@ gf_w128_split_4_128_multiply_region(gf_t *gf, void *src, void *dest, gf_val_128_
|
|||
printf("\n");
|
||||
}
|
||||
*/
|
||||
i = 0;
|
||||
while (d64 < top) {
|
||||
v[0] = (xor) ? d64[0] : 0;
|
||||
v[1] = (xor) ? d64[1] : 0;
|
||||
|
@ -613,7 +612,6 @@ gf_w128_split_4_128_sse_multiply_region(gf_t *gf, void *src, void *dest, gf_val_
|
|||
}
|
||||
|
||||
h = (gf_internal_t *) gf->scratch;
|
||||
pp = h->prim_poly;
|
||||
|
||||
/* We only do this to check on alignment. */
|
||||
gf_set_region_data(&rd, gf, src, dest, bytes, 0, xor, 16);
|
||||
|
@ -713,7 +711,6 @@ gf_w128_split_4_128_sse_altmap_multiply_region(gf_t *gf, void *src, void *dest,
|
|||
}
|
||||
|
||||
h = (gf_internal_t *) gf->scratch;
|
||||
pp = h->prim_poly;
|
||||
|
||||
/* We only do this to check on alignment. */
|
||||
gf_set_region_data(&rd, gf, src, dest, bytes, 0, xor, 256);
|
||||
|
@ -1149,7 +1146,7 @@ gf_w128_group_multiply_region(gf_t *gf, void *src, void *dest, gf_val_128_t val,
|
|||
}
|
||||
|
||||
/* a^-1 -> b */
|
||||
void
|
||||
void
|
||||
gf_w128_euclid(GFP gf, gf_val_128_t a128, gf_val_128_t b128)
|
||||
{
|
||||
uint64_t e_i[2], e_im1[2], e_ip1[2];
|
||||
|
@ -1242,7 +1239,7 @@ gf_w128_euclid(GFP gf, gf_val_128_t a128, gf_val_128_t b128)
|
|||
return;
|
||||
}
|
||||
|
||||
void
|
||||
void
|
||||
gf_w128_divide_from_inverse(GFP gf, gf_val_128_t a128, gf_val_128_t b128, gf_val_128_t c128)
|
||||
{
|
||||
uint64_t d[2];
|
||||
|
@ -1251,7 +1248,7 @@ gf_w128_divide_from_inverse(GFP gf, gf_val_128_t a128, gf_val_128_t b128, gf_val
|
|||
return;
|
||||
}
|
||||
|
||||
void
|
||||
void
|
||||
gf_w128_inverse_from_divide(GFP gf, gf_val_128_t a128, gf_val_128_t b128)
|
||||
{
|
||||
uint64_t one128[2];
|
||||
|
@ -1263,7 +1260,7 @@ gf_w128_inverse_from_divide(GFP gf, gf_val_128_t a128, gf_val_128_t b128)
|
|||
|
||||
|
||||
static
|
||||
void
|
||||
void
|
||||
gf_w128_composite_inverse(gf_t *gf, gf_val_128_t a, gf_val_128_t inv)
|
||||
{
|
||||
gf_internal_t *h = (gf_internal_t *) gf->scratch;
|
||||
|
@ -1408,14 +1405,14 @@ int gf_w128_composite_init(gf_t *gf)
|
|||
gf_internal_t *h = (gf_internal_t *) gf->scratch;
|
||||
|
||||
if (h->region_type & GF_REGION_ALTMAP) {
|
||||
gf->multiply_region.w128 = gf_w128_composite_multiply_region_alt;
|
||||
SET_FUNCTION(gf,multiply_region,w128,gf_w128_composite_multiply_region_alt)
|
||||
} else {
|
||||
gf->multiply_region.w128 = gf_w128_composite_multiply_region;
|
||||
SET_FUNCTION(gf,multiply_region,w128,gf_w128_composite_multiply_region)
|
||||
}
|
||||
|
||||
gf->multiply.w128 = gf_w128_composite_multiply;
|
||||
gf->divide.w128 = gf_w128_divide_from_inverse;
|
||||
gf->inverse.w128 = gf_w128_composite_inverse;
|
||||
SET_FUNCTION(gf,multiply,w128,gf_w128_composite_multiply)
|
||||
SET_FUNCTION(gf,divide,w128,gf_w128_divide_from_inverse)
|
||||
SET_FUNCTION(gf,inverse,w128,gf_w128_composite_inverse)
|
||||
|
||||
return 1;
|
||||
}
|
||||
|
@ -1424,10 +1421,12 @@ static
|
|||
int gf_w128_cfm_init(gf_t *gf)
|
||||
{
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
gf->inverse.w128 = gf_w128_euclid;
|
||||
gf->multiply.w128 = gf_w128_clm_multiply;
|
||||
gf->multiply_region.w128 = gf_w128_clm_multiply_region_from_single;
|
||||
return 1;
|
||||
if (gf_cpu_supports_intel_pclmul) {
|
||||
SET_FUNCTION(gf,inverse,w128,gf_w128_euclid)
|
||||
SET_FUNCTION(gf,multiply,w128,gf_w128_clm_multiply)
|
||||
SET_FUNCTION(gf,multiply_region,w128,gf_w128_clm_multiply_region_from_single)
|
||||
return 1;
|
||||
}
|
||||
#endif
|
||||
|
||||
return 0;
|
||||
|
@ -1436,9 +1435,9 @@ int gf_w128_cfm_init(gf_t *gf)
|
|||
static
|
||||
int gf_w128_shift_init(gf_t *gf)
|
||||
{
|
||||
gf->multiply.w128 = gf_w128_shift_multiply;
|
||||
gf->inverse.w128 = gf_w128_euclid;
|
||||
gf->multiply_region.w128 = gf_w128_multiply_region_from_single;
|
||||
SET_FUNCTION(gf,multiply,w128,gf_w128_shift_multiply)
|
||||
SET_FUNCTION(gf,inverse,w128,gf_w128_euclid)
|
||||
SET_FUNCTION(gf,multiply_region,w128,gf_w128_multiply_region_from_single)
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -1449,16 +1448,16 @@ int gf_w128_bytwo_init(gf_t *gf)
|
|||
h = (gf_internal_t *) gf->scratch;
|
||||
|
||||
if (h->mult_type == GF_MULT_BYTWO_p) {
|
||||
gf->multiply.w128 = gf_w128_bytwo_p_multiply;
|
||||
/*gf->multiply.w128 = gf_w128_sse_bytwo_p_multiply;*/
|
||||
SET_FUNCTION(gf,multiply,w128,gf_w128_bytwo_p_multiply)
|
||||
/*SET_FUNCTION(gf,multiply,w128,gf_w128_sse_bytwo_p_multiply)*/
|
||||
/* John: the sse function is slower.*/
|
||||
} else {
|
||||
gf->multiply.w128 = gf_w128_bytwo_b_multiply;
|
||||
/*gf->multiply.w128 = gf_w128_sse_bytwo_b_multiply;
|
||||
SET_FUNCTION(gf,multiply,w128,gf_w128_bytwo_b_multiply)
|
||||
/*SET_FUNCTION(gf,multiply,w128,gf_w128_sse_bytwo_b_multiply)
|
||||
Ben: This sse function is also slower. */
|
||||
}
|
||||
gf->inverse.w128 = gf_w128_euclid;
|
||||
gf->multiply_region.w128 = gf_w128_bytwo_b_multiply_region;
|
||||
SET_FUNCTION(gf,inverse,w128,gf_w128_euclid)
|
||||
SET_FUNCTION(gf,multiply_region,w128,gf_w128_bytwo_b_multiply_region)
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -1528,20 +1527,20 @@ int gf_w128_split_init(gf_t *gf)
|
|||
|
||||
h = (gf_internal_t *) gf->scratch;
|
||||
|
||||
gf->multiply.w128 = gf_w128_bytwo_p_multiply;
|
||||
SET_FUNCTION(gf,multiply,w128,gf_w128_bytwo_p_multiply)
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
if (!(h->region_type & GF_REGION_NOSSE)){
|
||||
gf->multiply.w128 = gf_w128_clm_multiply;
|
||||
if (gf_cpu_supports_intel_pclmul && !(h->region_type & GF_REGION_NOSIMD)){
|
||||
SET_FUNCTION(gf,multiply,w128,gf_w128_clm_multiply)
|
||||
}
|
||||
#endif
|
||||
|
||||
gf->inverse.w128 = gf_w128_euclid;
|
||||
SET_FUNCTION(gf,inverse,w128,gf_w128_euclid)
|
||||
|
||||
if ((h->arg1 != 4 && h->arg2 != 4) || h->mult_type == GF_MULT_DEFAULT) {
|
||||
sd8 = (struct gf_w128_split_8_128_data *) h->private;
|
||||
sd8->last_value[0] = 0;
|
||||
sd8->last_value[1] = 0;
|
||||
gf->multiply_region.w128 = gf_w128_split_8_128_multiply_region;
|
||||
SET_FUNCTION(gf,multiply_region,w128,gf_w128_split_8_128_multiply_region)
|
||||
} else {
|
||||
sd4 = (struct gf_w128_split_4_128_data *) h->private;
|
||||
sd4->last_value[0] = 0;
|
||||
|
@ -1549,23 +1548,19 @@ int gf_w128_split_init(gf_t *gf)
|
|||
if((h->region_type & GF_REGION_ALTMAP))
|
||||
{
|
||||
#ifdef INTEL_SSE4
|
||||
if(!(h->region_type & GF_REGION_NOSSE))
|
||||
gf->multiply_region.w128 = gf_w128_split_4_128_sse_altmap_multiply_region;
|
||||
if(gf_cpu_supports_intel_sse4 && !(h->region_type & GF_REGION_NOSIMD))
|
||||
SET_FUNCTION(gf,multiply_region,w128,gf_w128_split_4_128_sse_altmap_multiply_region)
|
||||
else
|
||||
return 0;
|
||||
#else
|
||||
return 0;
|
||||
#endif
|
||||
return 0;
|
||||
}
|
||||
else {
|
||||
#ifdef INTEL_SSE4
|
||||
if(!(h->region_type & GF_REGION_NOSSE))
|
||||
gf->multiply_region.w128 = gf_w128_split_4_128_sse_multiply_region;
|
||||
if(gf_cpu_supports_intel_sse4 && !(h->region_type & GF_REGION_NOSIMD))
|
||||
SET_FUNCTION(gf,multiply_region,w128,gf_w128_split_4_128_sse_multiply_region)
|
||||
else
|
||||
gf->multiply_region.w128 = gf_w128_split_4_128_multiply_region;
|
||||
#else
|
||||
gf->multiply_region.w128 = gf_w128_split_4_128_multiply_region;
|
||||
#endif
|
||||
SET_FUNCTION(gf,multiply_region,w128,gf_w128_split_4_128_multiply_region)
|
||||
}
|
||||
}
|
||||
return 1;
|
||||
|
@ -1589,9 +1584,9 @@ int gf_w128_group_init(gf_t *gf)
|
|||
gt->m_table[2] = 0;
|
||||
gt->m_table[3] = 0;
|
||||
|
||||
gf->multiply.w128 = gf_w128_group_multiply;
|
||||
gf->inverse.w128 = gf_w128_euclid;
|
||||
gf->multiply_region.w128 = gf_w128_group_multiply_region;
|
||||
SET_FUNCTION(gf,multiply,w128,gf_w128_group_multiply)
|
||||
SET_FUNCTION(gf,inverse,w128,gf_w128_euclid)
|
||||
SET_FUNCTION(gf,multiply_region,w128,gf_w128_group_multiply_region)
|
||||
|
||||
gf_w128_group_r_init(gf);
|
||||
|
||||
|
@ -1727,7 +1722,6 @@ int gf_w128_scratch_size(int mult_type, int region_type, int divide_type, int ar
|
|||
int gf_w128_init(gf_t *gf)
|
||||
{
|
||||
gf_internal_t *h;
|
||||
int no_default_flag = 0;
|
||||
|
||||
h = (gf_internal_t *) gf->scratch;
|
||||
|
||||
|
@ -1740,16 +1734,12 @@ int gf_w128_init(gf_t *gf)
|
|||
} else {
|
||||
h->prim_poly = 0x87; /* Omitting the leftmost 1 as in w=32 */
|
||||
}
|
||||
if (no_default_flag == 1) {
|
||||
fprintf(stderr,"Code contains no default irreducible polynomial for given base field\n");
|
||||
return 0;
|
||||
}
|
||||
}
|
||||
|
||||
gf->multiply.w128 = NULL;
|
||||
gf->divide.w128 = NULL;
|
||||
gf->inverse.w128 = NULL;
|
||||
gf->multiply_region.w128 = NULL;
|
||||
SET_FUNCTION(gf,multiply,w128,NULL)
|
||||
SET_FUNCTION(gf,divide,w128,NULL)
|
||||
SET_FUNCTION(gf,inverse,w128,NULL)
|
||||
SET_FUNCTION(gf,multiply_region,w128,NULL)
|
||||
switch(h->mult_type) {
|
||||
case GF_MULT_BYTWO_p:
|
||||
case GF_MULT_BYTWO_b: if (gf_w128_bytwo_init(gf) == 0) return 0; break;
|
||||
|
@ -1765,22 +1755,22 @@ int gf_w128_init(gf_t *gf)
|
|||
/* Ben: Used to be h->region_type == GF_REGION_ALTMAP, but failed since there
|
||||
are multiple flags in h->region_type */
|
||||
if (h->mult_type == GF_MULT_SPLIT_TABLE && (h->region_type & GF_REGION_ALTMAP)) {
|
||||
gf->extract_word.w128 = gf_w128_split_extract_word;
|
||||
SET_FUNCTION(gf,extract_word,w128,gf_w128_split_extract_word)
|
||||
} else if (h->mult_type == GF_MULT_COMPOSITE && h->region_type == GF_REGION_ALTMAP) {
|
||||
gf->extract_word.w128 = gf_w128_composite_extract_word;
|
||||
SET_FUNCTION(gf,extract_word,w128,gf_w128_composite_extract_word)
|
||||
} else {
|
||||
gf->extract_word.w128 = gf_w128_extract_word;
|
||||
SET_FUNCTION(gf,extract_word,w128,gf_w128_extract_word)
|
||||
}
|
||||
|
||||
if (h->divide_type == GF_DIVIDE_EUCLID) {
|
||||
gf->divide.w128 = gf_w128_divide_from_inverse;
|
||||
SET_FUNCTION(gf,divide,w128,gf_w128_divide_from_inverse)
|
||||
}
|
||||
|
||||
if (gf->inverse.w128 != NULL && gf->divide.w128 == NULL) {
|
||||
gf->divide.w128 = gf_w128_divide_from_inverse;
|
||||
SET_FUNCTION(gf,divide,w128,gf_w128_divide_from_inverse)
|
||||
}
|
||||
if (gf->inverse.w128 == NULL && gf->divide.w128 != NULL) {
|
||||
gf->inverse.w128 = gf_w128_inverse_from_divide;
|
||||
SET_FUNCTION(gf,inverse,w128,gf_w128_inverse_from_divide)
|
||||
}
|
||||
return 1;
|
||||
}
|
||||
|
|
289
src/gf_w16.c
|
@ -11,54 +11,8 @@
|
|||
#include "gf_int.h"
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
|
||||
#define GF_FIELD_WIDTH (16)
|
||||
#define GF_FIELD_SIZE (1 << GF_FIELD_WIDTH)
|
||||
#define GF_MULT_GROUP_SIZE GF_FIELD_SIZE-1
|
||||
|
||||
#define GF_BASE_FIELD_WIDTH (8)
|
||||
#define GF_BASE_FIELD_SIZE (1 << GF_BASE_FIELD_WIDTH)
|
||||
|
||||
struct gf_w16_logtable_data {
|
||||
uint16_t log_tbl[GF_FIELD_SIZE];
|
||||
uint16_t antilog_tbl[GF_FIELD_SIZE * 2];
|
||||
uint16_t inv_tbl[GF_FIELD_SIZE];
|
||||
uint16_t *d_antilog;
|
||||
};
|
||||
|
||||
struct gf_w16_zero_logtable_data {
|
||||
int log_tbl[GF_FIELD_SIZE];
|
||||
uint16_t _antilog_tbl[GF_FIELD_SIZE * 4];
|
||||
uint16_t *antilog_tbl;
|
||||
uint16_t inv_tbl[GF_FIELD_SIZE];
|
||||
};
|
||||
|
||||
struct gf_w16_lazytable_data {
|
||||
uint16_t log_tbl[GF_FIELD_SIZE];
|
||||
uint16_t antilog_tbl[GF_FIELD_SIZE * 2];
|
||||
uint16_t inv_tbl[GF_FIELD_SIZE];
|
||||
uint16_t *d_antilog;
|
||||
uint16_t lazytable[GF_FIELD_SIZE];
|
||||
};
|
||||
|
||||
struct gf_w16_bytwo_data {
|
||||
uint64_t prim_poly;
|
||||
uint64_t mask1;
|
||||
uint64_t mask2;
|
||||
};
|
||||
|
||||
struct gf_w16_split_8_8_data {
|
||||
uint16_t tables[3][256][256];
|
||||
};
|
||||
|
||||
struct gf_w16_group_4_4_data {
|
||||
uint16_t reduce[16];
|
||||
uint16_t shift[16];
|
||||
};
|
||||
|
||||
struct gf_w16_composite_data {
|
||||
uint8_t *mult_table;
|
||||
};
|
||||
#include "gf_w16.h"
|
||||
#include "gf_cpu.h"
|
||||
|
||||
#define AB2(ip, am1 ,am2, b, t1, t2) {\
|
||||
t1 = (b << 1) & am1;\
|
||||
|
@ -438,6 +392,7 @@ gf_val_32_t gf_w16_matrix (gf_t *gf, gf_val_32_t b)
|
|||
extra memory.
|
||||
*/
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
static
|
||||
inline
|
||||
gf_val_32_t
|
||||
|
@ -445,8 +400,6 @@ gf_w16_clm_multiply_2 (gf_t *gf, gf_val_32_t a16, gf_val_32_t b16)
|
|||
{
|
||||
gf_val_32_t rv = 0;
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
|
||||
__m128i a, b;
|
||||
__m128i result;
|
||||
__m128i prim_poly;
|
||||
|
@ -480,11 +433,11 @@ gf_w16_clm_multiply_2 (gf_t *gf, gf_val_32_t a16, gf_val_32_t b16)
|
|||
|
||||
rv = ((gf_val_32_t)_mm_extract_epi32(result, 0));
|
||||
|
||||
|
||||
#endif
|
||||
return rv;
|
||||
}
|
||||
#endif
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
static
|
||||
inline
|
||||
gf_val_32_t
|
||||
|
@ -492,8 +445,6 @@ gf_w16_clm_multiply_3 (gf_t *gf, gf_val_32_t a16, gf_val_32_t b16)
|
|||
{
|
||||
gf_val_32_t rv = 0;
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
|
||||
__m128i a, b;
|
||||
__m128i result;
|
||||
__m128i prim_poly;
|
||||
|
@ -520,11 +471,11 @@ gf_w16_clm_multiply_3 (gf_t *gf, gf_val_32_t a16, gf_val_32_t b16)
|
|||
|
||||
rv = ((gf_val_32_t)_mm_extract_epi32(result, 0));
|
||||
|
||||
|
||||
#endif
|
||||
return rv;
|
||||
}
|
||||
#endif
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
static
|
||||
inline
|
||||
gf_val_32_t
|
||||
|
@ -532,8 +483,6 @@ gf_w16_clm_multiply_4 (gf_t *gf, gf_val_32_t a16, gf_val_32_t b16)
|
|||
{
|
||||
gf_val_32_t rv = 0;
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
|
||||
__m128i a, b;
|
||||
__m128i result;
|
||||
__m128i prim_poly;
|
||||
|
@ -562,10 +511,9 @@ gf_w16_clm_multiply_4 (gf_t *gf, gf_val_32_t a16, gf_val_32_t b16)
|
|||
|
||||
rv = ((gf_val_32_t)_mm_extract_epi32(result, 0));
|
||||
|
||||
|
||||
#endif
|
||||
return rv;
|
||||
}
|
||||
#endif
|
||||
|
||||
|
||||
static
|
||||
|
@ -595,7 +543,7 @@ gf_w16_shift_multiply (gf_t *gf, gf_val_32_t a16, gf_val_32_t b16)
|
|||
static
|
||||
int gf_w16_shift_init(gf_t *gf)
|
||||
{
|
||||
gf->multiply.w32 = gf_w16_shift_multiply;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w16_shift_multiply)
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -603,25 +551,27 @@ static
|
|||
int gf_w16_cfm_init(gf_t *gf)
|
||||
{
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
gf_internal_t *h;
|
||||
if (gf_cpu_supports_intel_pclmul) {
|
||||
gf_internal_t *h;
|
||||
|
||||
h = (gf_internal_t *) gf->scratch;
|
||||
|
||||
/*Ben: Determining how many reductions to do */
|
||||
|
||||
if ((0xfe00 & h->prim_poly) == 0) {
|
||||
gf->multiply.w32 = gf_w16_clm_multiply_2;
|
||||
gf->multiply_region.w32 = gf_w16_clm_multiply_region_from_single_2;
|
||||
} else if((0xf000 & h->prim_poly) == 0) {
|
||||
gf->multiply.w32 = gf_w16_clm_multiply_3;
|
||||
gf->multiply_region.w32 = gf_w16_clm_multiply_region_from_single_3;
|
||||
} else if ((0xe000 & h->prim_poly) == 0) {
|
||||
gf->multiply.w32 = gf_w16_clm_multiply_4;
|
||||
gf->multiply_region.w32 = gf_w16_clm_multiply_region_from_single_4;
|
||||
} else {
|
||||
return 0;
|
||||
}
|
||||
return 1;
|
||||
h = (gf_internal_t *) gf->scratch;
|
||||
|
||||
/*Ben: Determining how many reductions to do */
|
||||
|
||||
if ((0xfe00 & h->prim_poly) == 0) {
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w16_clm_multiply_2)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_clm_multiply_region_from_single_2)
|
||||
} else if((0xf000 & h->prim_poly) == 0) {
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w16_clm_multiply_3)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_clm_multiply_region_from_single_3)
|
||||
} else if ((0xe000 & h->prim_poly) == 0) {
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w16_clm_multiply_4)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_clm_multiply_region_from_single_4)
|
||||
} else {
|
||||
return 0;
|
||||
}
|
||||
return 1;
|
||||
}
|
||||
#endif
|
||||
|
||||
return 0;
|
||||
|
@ -735,10 +685,9 @@ int gf_w16_log_init(gf_t *gf)
|
|||
|
||||
if (check) {
|
||||
if (h->mult_type != GF_MULT_LOG_TABLE) {
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
return gf_w16_cfm_init(gf);
|
||||
#endif
|
||||
if (gf_cpu_supports_intel_pclmul) {
|
||||
return gf_w16_cfm_init(gf);
|
||||
}
|
||||
return gf_w16_shift_init(gf);
|
||||
} else {
|
||||
_gf_errno = GF_E_LOGPOLY;
|
||||
|
@ -752,10 +701,10 @@ int gf_w16_log_init(gf_t *gf)
|
|||
ltd->inv_tbl[i] = ltd->antilog_tbl[GF_MULT_GROUP_SIZE-ltd->log_tbl[i]];
|
||||
}
|
||||
|
||||
gf->inverse.w32 = gf_w16_log_inverse;
|
||||
gf->divide.w32 = gf_w16_log_divide;
|
||||
gf->multiply.w32 = gf_w16_log_multiply;
|
||||
gf->multiply_region.w32 = gf_w16_log_multiply_region;
|
||||
SET_FUNCTION(gf,inverse,w32,gf_w16_log_inverse)
|
||||
SET_FUNCTION(gf,divide,w32,gf_w16_log_divide)
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w16_log_multiply)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_log_multiply_region)
|
||||
|
||||
return 1;
|
||||
}
|
||||
|
@ -995,11 +944,11 @@ gf_w16_table_lazy_multiply_region(gf_t *gf, void *src, void *dest, gf_val_32_t v
|
|||
gf_do_final_region_alignment(&rd);
|
||||
}
|
||||
|
||||
#ifdef INTEL_SSSE3
|
||||
static
|
||||
void
|
||||
gf_w16_split_4_16_lazy_sse_multiply_region(gf_t *gf, void *src, void *dest, gf_val_32_t val, int bytes, int xor)
|
||||
{
|
||||
#ifdef INTEL_SSSE3
|
||||
uint64_t i, j, *s64, *d64, *top64;;
|
||||
uint64_t c, prod;
|
||||
uint8_t low[4][16];
|
||||
|
@ -1125,14 +1074,14 @@ gf_w16_split_4_16_lazy_sse_multiply_region(gf_t *gf, void *src, void *dest, gf_v
|
|||
}
|
||||
|
||||
gf_do_final_region_alignment(&rd);
|
||||
#endif
|
||||
}
|
||||
#endif
|
||||
|
||||
#ifdef INTEL_SSSE3
|
||||
static
|
||||
void
|
||||
gf_w16_split_4_16_lazy_sse_altmap_multiply_region(gf_t *gf, void *src, void *dest, gf_val_32_t val, int bytes, int xor)
|
||||
{
|
||||
#ifdef INTEL_SSSE3
|
||||
uint64_t i, j, *s64, *d64, *top64;;
|
||||
uint64_t c, prod;
|
||||
uint8_t low[4][16];
|
||||
|
@ -1234,8 +1183,8 @@ gf_w16_split_4_16_lazy_sse_altmap_multiply_region(gf_t *gf, void *src, void *des
|
|||
}
|
||||
gf_do_final_region_alignment(&rd);
|
||||
|
||||
#endif
|
||||
}
|
||||
#endif
|
||||
|
||||
uint32_t
|
||||
gf_w16_split_8_8_multiply(gf_t *gf, gf_val_32_t a, gf_val_32_t b)
|
||||
|
@ -1263,16 +1212,11 @@ int gf_w16_split_init(gf_t *gf)
|
|||
{
|
||||
gf_internal_t *h;
|
||||
struct gf_w16_split_8_8_data *d8;
|
||||
int i, j, exp, issse3;
|
||||
uint32_t p, basep;
|
||||
int i, j, exp;
|
||||
uint32_t p, basep, tmp;
|
||||
|
||||
h = (gf_internal_t *) gf->scratch;
|
||||
|
||||
issse3 = 0;
|
||||
#ifdef INTEL_SSSE3
|
||||
issse3 = 1;
|
||||
#endif
|
||||
|
||||
if (h->arg1 == 8 && h->arg2 == 8) {
|
||||
d8 = (struct gf_w16_split_8_8_data *) h->private;
|
||||
basep = 1;
|
||||
|
@ -1295,14 +1239,15 @@ issse3 = 0;
|
|||
if (j&1) {
|
||||
d8->tables[exp][i][j] = d8->tables[exp][i][j^1] ^ p;
|
||||
} else {
|
||||
d8->tables[exp][i][j] = GF_MULTBY_TWO(d8->tables[exp][i][j>>1]);
|
||||
tmp = d8->tables[exp][i][j>>1];
|
||||
d8->tables[exp][i][j] = GF_MULTBY_TWO(tmp);
|
||||
}
|
||||
}
|
||||
}
|
||||
for (i = 0; i < 8; i++) basep = GF_MULTBY_TWO(basep);
|
||||
}
|
||||
gf->multiply.w32 = gf_w16_split_8_8_multiply;
|
||||
gf->multiply_region.w32 = gf_w16_split_8_16_lazy_multiply_region;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w16_split_8_8_multiply)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_split_8_16_lazy_multiply_region)
|
||||
return 1;
|
||||
|
||||
}
|
||||
|
@ -1314,32 +1259,45 @@ issse3 = 0;
|
|||
|
||||
/* Defaults */
|
||||
|
||||
if (issse3) {
|
||||
gf->multiply_region.w32 = gf_w16_split_4_16_lazy_sse_multiply_region;
|
||||
#ifdef INTEL_SSSE3
|
||||
if (gf_cpu_supports_intel_ssse3) {
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_split_4_16_lazy_sse_multiply_region)
|
||||
} else {
|
||||
gf->multiply_region.w32 = gf_w16_split_8_16_lazy_multiply_region;
|
||||
#elif ARM_NEON
|
||||
if (gf_cpu_supports_arm_neon) {
|
||||
gf_w16_neon_split_init(gf);
|
||||
} else {
|
||||
#endif
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_split_8_16_lazy_multiply_region)
|
||||
#if defined(INTEL_SSSE3) || defined(ARM_NEON)
|
||||
}
|
||||
|
||||
#endif
|
||||
|
||||
if ((h->arg1 == 8 && h->arg2 == 16) || (h->arg2 == 8 && h->arg1 == 16)) {
|
||||
gf->multiply_region.w32 = gf_w16_split_8_16_lazy_multiply_region;
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_split_8_16_lazy_multiply_region)
|
||||
|
||||
} else if ((h->arg1 == 4 && h->arg2 == 16) || (h->arg2 == 4 && h->arg1 == 16)) {
|
||||
if (issse3) {
|
||||
if(h->region_type & GF_REGION_ALTMAP && h->region_type & GF_REGION_NOSSE)
|
||||
gf->multiply_region.w32 = gf_w16_split_4_16_lazy_nosse_altmap_multiply_region;
|
||||
else if(h->region_type & GF_REGION_NOSSE)
|
||||
gf->multiply_region.w32 = gf_w16_split_4_16_lazy_multiply_region;
|
||||
else if(h->region_type & GF_REGION_ALTMAP)
|
||||
gf->multiply_region.w32 = gf_w16_split_4_16_lazy_sse_altmap_multiply_region;
|
||||
#if defined(INTEL_SSSE3) || defined(ARM_NEON)
|
||||
if (gf_cpu_supports_intel_ssse3 || gf_cpu_supports_arm_neon) {
|
||||
if(h->region_type & GF_REGION_ALTMAP && h->region_type & GF_REGION_NOSIMD)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_split_4_16_lazy_nosse_altmap_multiply_region)
|
||||
else if(h->region_type & GF_REGION_NOSIMD)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_split_4_16_lazy_multiply_region)
|
||||
#if defined(INTEL_SSSE3)
|
||||
else if(h->region_type & GF_REGION_ALTMAP && gf_cpu_supports_intel_ssse3)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_split_4_16_lazy_sse_altmap_multiply_region)
|
||||
#endif
|
||||
} else {
|
||||
if(h->region_type & GF_REGION_SSE)
|
||||
#endif
|
||||
if(h->region_type & GF_REGION_SIMD)
|
||||
return 0;
|
||||
else if(h->region_type & GF_REGION_ALTMAP)
|
||||
gf->multiply_region.w32 = gf_w16_split_4_16_lazy_nosse_altmap_multiply_region;
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_split_4_16_lazy_nosse_altmap_multiply_region)
|
||||
else
|
||||
gf->multiply_region.w32 = gf_w16_split_4_16_lazy_multiply_region;
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_split_4_16_lazy_multiply_region)
|
||||
#if defined(INTEL_SSSE3) || defined(ARM_NEON)
|
||||
}
|
||||
#endif
|
||||
}
|
||||
|
||||
return 1;
|
||||
|
@ -1350,7 +1308,7 @@ int gf_w16_table_init(gf_t *gf)
|
|||
{
|
||||
gf_w16_log_init(gf);
|
||||
|
||||
gf->multiply_region.w32 = gf_w16_table_lazy_multiply_region;
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_table_lazy_multiply_region)
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -1881,28 +1839,30 @@ int gf_w16_bytwo_init(gf_t *gf)
|
|||
}
|
||||
|
||||
if (h->mult_type == GF_MULT_BYTWO_p) {
|
||||
gf->multiply.w32 = gf_w16_bytwo_p_multiply;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w16_bytwo_p_multiply)
|
||||
#ifdef INTEL_SSE2
|
||||
if (h->region_type & GF_REGION_NOSSE)
|
||||
gf->multiply_region.w32 = gf_w16_bytwo_p_nosse_multiply_region;
|
||||
else
|
||||
gf->multiply_region.w32 = gf_w16_bytwo_p_sse_multiply_region;
|
||||
#else
|
||||
gf->multiply_region.w32 = gf_w16_bytwo_p_nosse_multiply_region;
|
||||
if(h->region_type & GF_REGION_SSE)
|
||||
if (gf_cpu_supports_intel_sse2 && !(h->region_type & GF_REGION_NOSIMD)) {
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_bytwo_p_sse_multiply_region)
|
||||
} else {
|
||||
#endif
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_bytwo_p_nosse_multiply_region)
|
||||
if(h->region_type & GF_REGION_SIMD)
|
||||
return 0;
|
||||
#ifdef INTEL_SSE2
|
||||
}
|
||||
#endif
|
||||
} else {
|
||||
gf->multiply.w32 = gf_w16_bytwo_b_multiply;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w16_bytwo_b_multiply)
|
||||
#ifdef INTEL_SSE2
|
||||
if (h->region_type & GF_REGION_NOSSE)
|
||||
gf->multiply_region.w32 = gf_w16_bytwo_b_nosse_multiply_region;
|
||||
else
|
||||
gf->multiply_region.w32 = gf_w16_bytwo_b_sse_multiply_region;
|
||||
#else
|
||||
gf->multiply_region.w32 = gf_w16_bytwo_b_nosse_multiply_region;
|
||||
if(h->region_type & GF_REGION_SSE)
|
||||
if (gf_cpu_supports_intel_sse2 && !(h->region_type & GF_REGION_NOSIMD)) {
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_bytwo_b_sse_multiply_region)
|
||||
} else {
|
||||
#endif
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_bytwo_b_nosse_multiply_region)
|
||||
if(h->region_type & GF_REGION_SIMD)
|
||||
return 0;
|
||||
#ifdef INTEL_SSE2
|
||||
}
|
||||
#endif
|
||||
}
|
||||
|
||||
|
@ -1941,10 +1901,10 @@ int gf_w16_log_zero_init(gf_t *gf)
|
|||
ltd->inv_tbl[i] = ltd->antilog_tbl[GF_MULT_GROUP_SIZE-ltd->log_tbl[i]];
|
||||
}
|
||||
|
||||
gf->inverse.w32 = gf_w16_log_zero_inverse;
|
||||
gf->divide.w32 = gf_w16_log_zero_divide;
|
||||
gf->multiply.w32 = gf_w16_log_zero_multiply;
|
||||
gf->multiply_region.w32 = gf_w16_log_zero_multiply_region;
|
||||
SET_FUNCTION(gf,inverse,w32,gf_w16_log_zero_inverse)
|
||||
SET_FUNCTION(gf,divide,w32,gf_w16_log_zero_divide)
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w16_log_zero_multiply)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_log_zero_multiply_region)
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -2182,18 +2142,18 @@ int gf_w16_composite_init(gf_t *gf)
|
|||
cd->mult_table = gf_w8_get_mult_table(h->base_gf);
|
||||
|
||||
if (h->region_type & GF_REGION_ALTMAP) {
|
||||
gf->multiply_region.w32 = gf_w16_composite_multiply_region_alt;
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_composite_multiply_region_alt)
|
||||
} else {
|
||||
gf->multiply_region.w32 = gf_w16_composite_multiply_region;
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_composite_multiply_region)
|
||||
}
|
||||
|
||||
if (cd->mult_table == NULL) {
|
||||
gf->multiply.w32 = gf_w16_composite_multiply_recursive;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w16_composite_multiply_recursive)
|
||||
} else {
|
||||
gf->multiply.w32 = gf_w16_composite_multiply_inline;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w16_composite_multiply_inline)
|
||||
}
|
||||
gf->divide.w32 = NULL;
|
||||
gf->inverse.w32 = gf_w16_composite_inverse;
|
||||
SET_FUNCTION(gf,divide,w32,NULL)
|
||||
SET_FUNCTION(gf,inverse,w32,gf_w16_composite_inverse)
|
||||
|
||||
return 1;
|
||||
}
|
||||
|
@ -2270,7 +2230,6 @@ void gf_w16_group_4_4_region_multiply(gf_t *gf, void *src, void *dest, gf_val_32
|
|||
top = (uint16_t *) rd.d_top;
|
||||
|
||||
while (d16 < top) {
|
||||
p = 0;
|
||||
a16 = *s16;
|
||||
p16 = (xor) ? *d16 : 0;
|
||||
ind = a16 >> 12;
|
||||
|
@ -2315,10 +2274,10 @@ int gf_w16_group_init(gf_t *gf)
|
|||
d44->reduce[p>>16] = (p&0xffff);
|
||||
}
|
||||
|
||||
gf->multiply.w32 = gf_w16_group_4_4_multiply;
|
||||
gf->divide.w32 = NULL;
|
||||
gf->inverse.w32 = NULL;
|
||||
gf->multiply_region.w32 = gf_w16_group_4_4_region_multiply;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w16_group_4_4_multiply)
|
||||
SET_FUNCTION(gf,divide,w32,NULL)
|
||||
SET_FUNCTION(gf,inverse,w32,NULL)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_group_4_4_region_multiply)
|
||||
|
||||
return 1;
|
||||
}
|
||||
|
@ -2398,10 +2357,10 @@ int gf_w16_init(gf_t *gf)
|
|||
|
||||
if (h->mult_type != GF_MULT_COMPOSITE) h->prim_poly |= (1 << 16);
|
||||
|
||||
gf->multiply.w32 = NULL;
|
||||
gf->divide.w32 = NULL;
|
||||
gf->inverse.w32 = NULL;
|
||||
gf->multiply_region.w32 = NULL;
|
||||
SET_FUNCTION(gf,multiply,w32,NULL)
|
||||
SET_FUNCTION(gf,divide,w32,NULL)
|
||||
SET_FUNCTION(gf,inverse,w32,NULL)
|
||||
SET_FUNCTION(gf,multiply_region,w32,NULL)
|
||||
|
||||
switch(h->mult_type) {
|
||||
case GF_MULT_LOG_ZERO: if (gf_w16_log_zero_init(gf) == 0) return 0; break;
|
||||
|
@ -2418,34 +2377,34 @@ int gf_w16_init(gf_t *gf)
|
|||
default: return 0;
|
||||
}
|
||||
if (h->divide_type == GF_DIVIDE_EUCLID) {
|
||||
gf->divide.w32 = gf_w16_divide_from_inverse;
|
||||
gf->inverse.w32 = gf_w16_euclid;
|
||||
SET_FUNCTION(gf,divide,w32,gf_w16_divide_from_inverse)
|
||||
SET_FUNCTION(gf,inverse,w32,gf_w16_euclid)
|
||||
} else if (h->divide_type == GF_DIVIDE_MATRIX) {
|
||||
gf->divide.w32 = gf_w16_divide_from_inverse;
|
||||
gf->inverse.w32 = gf_w16_matrix;
|
||||
SET_FUNCTION(gf,divide,w32,gf_w16_divide_from_inverse)
|
||||
SET_FUNCTION(gf,inverse,w32,gf_w16_matrix)
|
||||
}
|
||||
|
||||
if (gf->divide.w32 == NULL) {
|
||||
gf->divide.w32 = gf_w16_divide_from_inverse;
|
||||
if (gf->inverse.w32 == NULL) gf->inverse.w32 = gf_w16_euclid;
|
||||
SET_FUNCTION(gf,divide,w32,gf_w16_divide_from_inverse)
|
||||
if (gf->inverse.w32 == NULL) SET_FUNCTION(gf,inverse,w32,gf_w16_euclid)
|
||||
}
|
||||
|
||||
if (gf->inverse.w32 == NULL) gf->inverse.w32 = gf_w16_inverse_from_divide;
|
||||
if (gf->inverse.w32 == NULL) SET_FUNCTION(gf,inverse,w32,gf_w16_inverse_from_divide)
|
||||
|
||||
if (h->region_type & GF_REGION_ALTMAP) {
|
||||
if (h->mult_type == GF_MULT_COMPOSITE) {
|
||||
gf->extract_word.w32 = gf_w16_composite_extract_word;
|
||||
SET_FUNCTION(gf,extract_word,w32,gf_w16_composite_extract_word)
|
||||
} else {
|
||||
gf->extract_word.w32 = gf_w16_split_extract_word;
|
||||
SET_FUNCTION(gf,extract_word,w32,gf_w16_split_extract_word)
|
||||
}
|
||||
} else if (h->region_type == GF_REGION_CAUCHY) {
|
||||
gf->multiply_region.w32 = gf_wgen_cauchy_region;
|
||||
gf->extract_word.w32 = gf_wgen_extract_word;
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_wgen_cauchy_region)
|
||||
SET_FUNCTION(gf,extract_word,w32,gf_wgen_extract_word)
|
||||
} else {
|
||||
gf->extract_word.w32 = gf_w16_extract_word;
|
||||
SET_FUNCTION(gf,extract_word,w32,gf_w16_extract_word)
|
||||
}
|
||||
if (gf->multiply_region.w32 == NULL) {
|
||||
gf->multiply_region.w32 = gf_w16_multiply_region_from_single;
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_multiply_region_from_single)
|
||||
}
|
||||
return 1;
|
||||
}
|
||||
|
|
379
src/gf_w32.c
|
@ -12,59 +12,8 @@
|
|||
#include "gf_int.h"
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
|
||||
#define GF_FIELD_WIDTH (32)
|
||||
#define GF_FIRST_BIT (1 << 31)
|
||||
|
||||
#define GF_BASE_FIELD_WIDTH (16)
|
||||
#define GF_BASE_FIELD_SIZE (1 << GF_BASE_FIELD_WIDTH)
|
||||
#define GF_BASE_FIELD_GROUP_SIZE GF_BASE_FIELD_SIZE-1
|
||||
#define GF_MULTBY_TWO(p) (((p) & GF_FIRST_BIT) ? (((p) << 1) ^ h->prim_poly) : (p) << 1)
|
||||
|
||||
struct gf_split_2_32_lazy_data {
|
||||
uint32_t tables[16][4];
|
||||
uint32_t last_value;
|
||||
};
|
||||
|
||||
struct gf_w32_split_8_8_data {
|
||||
uint32_t tables[7][256][256];
|
||||
uint32_t region_tables[4][256];
|
||||
uint32_t last_value;
|
||||
};
|
||||
|
||||
struct gf_w32_group_data {
|
||||
uint32_t *reduce;
|
||||
uint32_t *shift;
|
||||
int tshift;
|
||||
uint64_t rmask;
|
||||
uint32_t *memory;
|
||||
};
|
||||
|
||||
struct gf_split_16_32_lazy_data {
|
||||
uint32_t tables[2][(1<<16)];
|
||||
uint32_t last_value;
|
||||
};
|
||||
|
||||
struct gf_split_8_32_lazy_data {
|
||||
uint32_t tables[4][256];
|
||||
uint32_t last_value;
|
||||
};
|
||||
|
||||
struct gf_split_4_32_lazy_data {
|
||||
uint32_t tables[8][16];
|
||||
uint32_t last_value;
|
||||
};
|
||||
|
||||
struct gf_w32_bytwo_data {
|
||||
uint64_t prim_poly;
|
||||
uint64_t mask1;
|
||||
uint64_t mask2;
|
||||
};
|
||||
|
||||
struct gf_w32_composite_data {
|
||||
uint16_t *log;
|
||||
uint16_t *alog;
|
||||
};
|
||||
#include "gf_w32.h"
|
||||
#include "gf_cpu.h"
|
||||
|
||||
#define MM_PRINT32(s, r) { uint8_t blah[16], ii; printf("%-12s", s); _mm_storeu_si128((__m128i *)blah, r); for (ii = 0; ii < 16; ii += 4) printf(" %02x%02x%02x%02x", blah[15-ii], blah[14-ii], blah[13-ii], blah[12-ii]); printf("\n"); }
|
||||
|
||||
|
@ -102,7 +51,7 @@ void
|
|||
gf_w32_multiply_region_from_single(gf_t *gf, void *src, void *dest, uint32_t val, int bytes, int
|
||||
xor)
|
||||
{
|
||||
int i;
|
||||
uint32_t i;
|
||||
uint32_t *s32;
|
||||
uint32_t *d32;
|
||||
|
||||
|
@ -127,7 +76,7 @@ void
|
|||
gf_w32_clm_multiply_region_from_single_2(gf_t *gf, void *src, void *dest, uint32_t val, int bytes, int xor)
|
||||
{
|
||||
|
||||
int i;
|
||||
uint32_t i;
|
||||
uint32_t *s32;
|
||||
uint32_t *d32;
|
||||
|
||||
|
@ -177,7 +126,7 @@ void
|
|||
gf_w32_clm_multiply_region_from_single_3(gf_t *gf, void *src, void *dest, uint32_t val, int bytes, int xor)
|
||||
{
|
||||
|
||||
int i;
|
||||
uint32_t i;
|
||||
uint32_t *s32;
|
||||
uint32_t *d32;
|
||||
|
||||
|
@ -230,7 +179,7 @@ static
|
|||
void
|
||||
gf_w32_clm_multiply_region_from_single_4(gf_t *gf, void *src, void *dest, uint32_t val, int bytes, int xor)
|
||||
{
|
||||
int i;
|
||||
uint32_t i;
|
||||
uint32_t *s32;
|
||||
uint32_t *d32;
|
||||
|
||||
|
@ -399,7 +348,8 @@ uint32_t gf_w32_matrix (gf_t *gf, uint32_t b)
|
|||
extra memory.
|
||||
*/
|
||||
|
||||
//ADAM
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
|
||||
static
|
||||
inline
|
||||
gf_val_32_t
|
||||
|
@ -407,8 +357,6 @@ gf_w32_cfmgk_multiply (gf_t *gf, gf_val_32_t a32, gf_val_32_t b32)
|
|||
{
|
||||
gf_val_32_t rv = 0;
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
|
||||
__m128i a, b;
|
||||
__m128i result;
|
||||
__m128i w;
|
||||
|
@ -431,11 +379,10 @@ gf_w32_cfmgk_multiply (gf_t *gf, gf_val_32_t a32, gf_val_32_t b32)
|
|||
|
||||
/* Extracts 32 bit value from result. */
|
||||
rv = ((gf_val_32_t)_mm_extract_epi32(result, 0));
|
||||
#endif
|
||||
return rv;
|
||||
}
|
||||
#endif
|
||||
|
||||
//ADAM
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
|
||||
static
|
||||
|
@ -443,7 +390,7 @@ void
|
|||
gf_w32_cfmgk_multiply_region_from_single(gf_t *gf, void *src, void *dest, uint32_t val, int bytes, int xor)
|
||||
{
|
||||
|
||||
int i;
|
||||
uint32_t i;
|
||||
uint32_t *s32;
|
||||
uint32_t *d32;
|
||||
|
||||
|
@ -460,9 +407,9 @@ gf_w32_cfmgk_multiply_region_from_single(gf_t *gf, void *src, void *dest, uint32
|
|||
q_plus = *(uint64_t *) h->private;
|
||||
g_star = *((uint64_t *) h->private + 1);
|
||||
|
||||
a = _mm_insert_epi32 (_mm_setzero_si128(), val, 0);
|
||||
g = _mm_insert_epi64 (a, g_star, 0);
|
||||
q = _mm_insert_epi64 (a, q_plus, 0);
|
||||
a = _mm_insert_epi32 (_mm_setzero_si128(), val, 0);
|
||||
s32 = (uint32_t *) src;
|
||||
d32 = (uint32_t *) dest;
|
||||
|
||||
|
@ -489,6 +436,8 @@ gf_w32_cfmgk_multiply_region_from_single(gf_t *gf, void *src, void *dest, uint32
|
|||
#endif
|
||||
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
|
||||
static
|
||||
inline
|
||||
gf_val_32_t
|
||||
|
@ -496,8 +445,6 @@ gf_w32_clm_multiply_2 (gf_t *gf, gf_val_32_t a32, gf_val_32_t b32)
|
|||
{
|
||||
gf_val_32_t rv = 0;
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
|
||||
__m128i a, b;
|
||||
__m128i result;
|
||||
__m128i prim_poly;
|
||||
|
@ -530,9 +477,11 @@ gf_w32_clm_multiply_2 (gf_t *gf, gf_val_32_t a32, gf_val_32_t b32)
|
|||
|
||||
/* Extracts 32 bit value from result. */
|
||||
rv = ((gf_val_32_t)_mm_extract_epi32(result, 0));
|
||||
#endif
|
||||
return rv;
|
||||
}
|
||||
#endif
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
|
||||
static
|
||||
inline
|
||||
|
@ -541,8 +490,6 @@ gf_w32_clm_multiply_3 (gf_t *gf, gf_val_32_t a32, gf_val_32_t b32)
|
|||
{
|
||||
gf_val_32_t rv = 0;
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
|
||||
__m128i a, b;
|
||||
__m128i result;
|
||||
__m128i prim_poly;
|
||||
|
@ -569,9 +516,11 @@ gf_w32_clm_multiply_3 (gf_t *gf, gf_val_32_t a32, gf_val_32_t b32)
|
|||
/* Extracts 32 bit value from result. */
|
||||
|
||||
rv = ((gf_val_32_t)_mm_extract_epi32(result, 0));
|
||||
#endif
|
||||
return rv;
|
||||
}
|
||||
#endif
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
|
||||
static
|
||||
inline
|
||||
|
@ -580,8 +529,6 @@ gf_w32_clm_multiply_4 (gf_t *gf, gf_val_32_t a32, gf_val_32_t b32)
|
|||
{
|
||||
gf_val_32_t rv = 0;
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
|
||||
__m128i a, b;
|
||||
__m128i result;
|
||||
__m128i prim_poly;
|
||||
|
@ -610,9 +557,9 @@ gf_w32_clm_multiply_4 (gf_t *gf, gf_val_32_t a32, gf_val_32_t b32)
|
|||
/* Extracts 32 bit value from result. */
|
||||
|
||||
rv = ((gf_val_32_t)_mm_extract_epi32(result, 0));
|
||||
#endif
|
||||
return rv;
|
||||
}
|
||||
#endif
|
||||
|
||||
|
||||
static
|
||||
|
@ -640,40 +587,38 @@ gf_w32_shift_multiply (gf_t *gf, uint32_t a32, uint32_t b32)
|
|||
return product;
|
||||
}
|
||||
|
||||
//ADAM
|
||||
static
|
||||
int gf_w32_cfmgk_init(gf_t *gf)
|
||||
{
|
||||
gf->inverse.w32 = gf_w32_euclid;
|
||||
gf->multiply_region.w32 = gf_w32_multiply_region_from_single;
|
||||
SET_FUNCTION(gf,inverse,w32,gf_w32_euclid)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_multiply_region_from_single)
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
gf_internal_t *h;
|
||||
if (gf_cpu_supports_intel_pclmul) {
|
||||
gf_internal_t *h;
|
||||
|
||||
h = (gf_internal_t *) gf->scratch;
|
||||
gf->multiply.w32 = gf_w32_cfmgk_multiply;
|
||||
gf->multiply_region.w32 = gf_w32_cfmgk_multiply_region_from_single;
|
||||
h = (gf_internal_t *) gf->scratch;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w32_cfmgk_multiply)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_cfmgk_multiply_region_from_single)
|
||||
|
||||
//setup in the private section the q+ and g* ADAM
|
||||
uint64_t *q_plus = (uint64_t *) h->private;
|
||||
uint64_t *g_star = (uint64_t *) h->private + 1;
|
||||
uint64_t *q_plus = (uint64_t *) h->private;
|
||||
uint64_t *g_star = (uint64_t *) h->private + 1;
|
||||
|
||||
//q+
|
||||
uint64_t tmp = h->prim_poly << 32;
|
||||
*q_plus = 1ULL << 32;
|
||||
uint64_t tmp = h->prim_poly << 32;
|
||||
*q_plus = 1ULL << 32;
|
||||
|
||||
int i;
|
||||
for(i = 63; i >= 32; i--)
|
||||
if((1ULL << i) & tmp)
|
||||
{
|
||||
*q_plus |= 1ULL << (i-32);
|
||||
tmp ^= h->prim_poly << (i-32);
|
||||
}
|
||||
int i;
|
||||
for(i = 63; i >= 32; i--)
|
||||
if((1ULL << i) & tmp)
|
||||
{
|
||||
*q_plus |= 1ULL << (i-32);
|
||||
tmp ^= h->prim_poly << (i-32);
|
||||
}
|
||||
|
||||
//g*
|
||||
*g_star = h->prim_poly & ((1ULL << 32) - 1);
|
||||
*g_star = h->prim_poly & ((1ULL << 32) - 1);
|
||||
|
||||
return 1;
|
||||
return 1;
|
||||
}
|
||||
#endif
|
||||
|
||||
return 0;
|
||||
|
@ -682,30 +627,32 @@ int gf_w32_cfmgk_init(gf_t *gf)
|
|||
static
|
||||
int gf_w32_cfm_init(gf_t *gf)
|
||||
{
|
||||
gf->inverse.w32 = gf_w32_euclid;
|
||||
gf->multiply_region.w32 = gf_w32_multiply_region_from_single;
|
||||
SET_FUNCTION(gf,inverse,w32,gf_w32_euclid)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_multiply_region_from_single)
|
||||
|
||||
/*Ben: We also check to see if the prim poly will work for pclmul */
|
||||
/*Ben: Check to see how many reduction steps it will take*/
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
gf_internal_t *h;
|
||||
if (gf_cpu_supports_intel_pclmul) {
|
||||
gf_internal_t *h;
|
||||
|
||||
h = (gf_internal_t *) gf->scratch;
|
||||
h = (gf_internal_t *) gf->scratch;
|
||||
|
||||
if ((0xfffe0000 & h->prim_poly) == 0){
|
||||
gf->multiply.w32 = gf_w32_clm_multiply_2;
|
||||
gf->multiply_region.w32 = gf_w32_clm_multiply_region_from_single_2;
|
||||
}else if ((0xffc00000 & h->prim_poly) == 0){
|
||||
gf->multiply.w32 = gf_w32_clm_multiply_3;
|
||||
gf->multiply_region.w32 = gf_w32_clm_multiply_region_from_single_3;
|
||||
}else if ((0xfe000000 & h->prim_poly) == 0){
|
||||
gf->multiply.w32 = gf_w32_clm_multiply_4;
|
||||
gf->multiply_region.w32 = gf_w32_clm_multiply_region_from_single_4;
|
||||
} else {
|
||||
return 0;
|
||||
if ((0xfffe0000 & h->prim_poly) == 0){
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w32_clm_multiply_2)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_clm_multiply_region_from_single_2)
|
||||
}else if ((0xffc00000 & h->prim_poly) == 0){
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w32_clm_multiply_3)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_clm_multiply_region_from_single_3)
|
||||
}else if ((0xfe000000 & h->prim_poly) == 0){
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w32_clm_multiply_4)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_clm_multiply_region_from_single_4)
|
||||
} else {
|
||||
return 0;
|
||||
}
|
||||
return 1;
|
||||
}
|
||||
return 1;
|
||||
#endif
|
||||
|
||||
return 0;
|
||||
|
@ -714,9 +661,9 @@ int gf_w32_cfm_init(gf_t *gf)
|
|||
static
|
||||
int gf_w32_shift_init(gf_t *gf)
|
||||
{
|
||||
gf->inverse.w32 = gf_w32_euclid;
|
||||
gf->multiply_region.w32 = gf_w32_multiply_region_from_single;
|
||||
gf->multiply.w32 = gf_w32_shift_multiply;
|
||||
SET_FUNCTION(gf,inverse,w32,gf_w32_euclid)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_multiply_region_from_single)
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w32_shift_multiply)
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -724,12 +671,12 @@ static
|
|||
void
|
||||
gf_w32_group_set_shift_tables(uint32_t *shift, uint32_t val, gf_internal_t *h)
|
||||
{
|
||||
int i;
|
||||
uint32_t i;
|
||||
uint32_t j;
|
||||
|
||||
shift[0] = 0;
|
||||
|
||||
for (i = 1; i < (1 << h->arg1); i <<= 1) {
|
||||
for (i = 1; i < ((uint32_t)1 << h->arg1); i <<= 1) {
|
||||
for (j = 0; j < i; j++) shift[i|j] = shift[j]^val;
|
||||
if (val & GF_FIRST_BIT) {
|
||||
val <<= 1;
|
||||
|
@ -914,7 +861,6 @@ gf_w32_group_4_4_multiply(gf_t *gf, gf_val_32_t a, gf_val_32_t b)
|
|||
d44 = (struct gf_w32_group_data *) h->private;
|
||||
gf_w32_group_set_shift_tables(d44->shift, b, h);
|
||||
|
||||
p = 0;
|
||||
a32 = a;
|
||||
ind = a32 >> 28;
|
||||
a32 <<= 4;
|
||||
|
@ -1133,7 +1079,7 @@ gf_w32_bytwo_p_sse_multiply_region(gf_t *gf, void *src, void *dest, gf_val_32_t
|
|||
vrev = 0;
|
||||
for (i = 0; i < 32; i++) {
|
||||
vrev <<= 1;
|
||||
if (!(val & (1 << i))) vrev |= 1;
|
||||
if (!(val & ((gf_val_32_t)1 << i))) vrev |= 1;
|
||||
}
|
||||
|
||||
s8 = (uint8_t *) rd.s_start;
|
||||
|
@ -1439,32 +1385,34 @@ int gf_w32_bytwo_init(gf_t *gf)
|
|||
}
|
||||
|
||||
if (h->mult_type == GF_MULT_BYTWO_p) {
|
||||
gf->multiply.w32 = gf_w32_bytwo_p_multiply;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w32_bytwo_p_multiply)
|
||||
#ifdef INTEL_SSE2
|
||||
if (h->region_type & GF_REGION_NOSSE)
|
||||
gf->multiply_region.w32 = gf_w32_bytwo_p_nosse_multiply_region;
|
||||
else
|
||||
gf->multiply_region.w32 = gf_w32_bytwo_p_sse_multiply_region;
|
||||
#else
|
||||
gf->multiply_region.w32 = gf_w32_bytwo_p_nosse_multiply_region;
|
||||
if(h->region_type & GF_REGION_SSE)
|
||||
return 0;
|
||||
if (gf_cpu_supports_intel_sse2 && !(h->region_type & GF_REGION_NOSIMD)) {
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_bytwo_p_sse_multiply_region)
|
||||
} else {
|
||||
#endif
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_bytwo_p_nosse_multiply_region)
|
||||
if(h->region_type & GF_REGION_SIMD)
|
||||
return 0;
|
||||
#ifdef INTEL_SSE2
|
||||
}
|
||||
#endif
|
||||
} else {
|
||||
gf->multiply.w32 = gf_w32_bytwo_b_multiply;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w32_bytwo_b_multiply)
|
||||
#ifdef INTEL_SSE2
|
||||
if (h->region_type & GF_REGION_NOSSE)
|
||||
gf->multiply_region.w32 = gf_w32_bytwo_b_nosse_multiply_region;
|
||||
else
|
||||
gf->multiply_region.w32 = gf_w32_bytwo_b_sse_multiply_region;
|
||||
#else
|
||||
gf->multiply_region.w32 = gf_w32_bytwo_b_nosse_multiply_region;
|
||||
if(h->region_type & GF_REGION_SSE)
|
||||
if (gf_cpu_supports_intel_sse2 && !(h->region_type & GF_REGION_NOSIMD)) {
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_bytwo_b_sse_multiply_region)
|
||||
} else {
|
||||
#endif
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_bytwo_b_nosse_multiply_region)
|
||||
if(h->region_type & GF_REGION_SIMD)
|
||||
return 0;
|
||||
#ifdef INTEL_SSE2
|
||||
}
|
||||
#endif
|
||||
}
|
||||
|
||||
gf->inverse.w32 = gf_w32_euclid;
|
||||
SET_FUNCTION(gf,inverse,w32,gf_w32_euclid)
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -1609,7 +1557,7 @@ gf_w32_split_16_32_lazy_multiply_region(gf_t *gf, void *src, void *dest, uint32_
|
|||
p = (xor) ? *d32 : 0;
|
||||
a = *s32;
|
||||
i = 0;
|
||||
while (a != 0) {
|
||||
while (a != 0 && i < 2) {
|
||||
v = (a & 0xffff);
|
||||
p ^= t[i][v];
|
||||
a >>= 16;
|
||||
|
@ -1745,7 +1693,6 @@ gf_w32_split_2_32_lazy_sse_multiply_region(gf_t *gf, void *src, void *dest, uint
|
|||
xi = _mm_and_si128(si, mask2);
|
||||
xi = _mm_xor_si128(xi, adder);
|
||||
pi = _mm_xor_si128(pi, _mm_shuffle_epi8(tables[tindex], xi));
|
||||
si = _mm_srli_epi16(si, 2);
|
||||
tindex++;
|
||||
|
||||
vi = _mm_srli_epi32(vi, 8);
|
||||
|
@ -1815,11 +1762,11 @@ gf_w32_split_4_32_lazy_multiply_region(gf_t *gf, void *src, void *dest, uint32_t
|
|||
gf_do_final_region_alignment(&rd);
|
||||
}
|
||||
|
||||
#ifdef INTEL_SSSE3
|
||||
static
|
||||
void
|
||||
gf_w32_split_4_32_lazy_sse_altmap_multiply_region(gf_t *gf, void *src, void *dest, uint32_t val, int bytes, int xor)
|
||||
{
|
||||
#ifdef INTEL_SSSE3
|
||||
gf_internal_t *h;
|
||||
int i, j, k;
|
||||
uint32_t pp, v, *s32, *d32, *top;
|
||||
|
@ -2002,16 +1949,15 @@ gf_w32_split_4_32_lazy_sse_altmap_multiply_region(gf_t *gf, void *src, void *des
|
|||
}
|
||||
|
||||
gf_do_final_region_alignment(&rd);
|
||||
|
||||
#endif
|
||||
}
|
||||
#endif
|
||||
|
||||
|
||||
#ifdef INTEL_SSSE3
|
||||
static
|
||||
void
|
||||
gf_w32_split_4_32_lazy_sse_multiply_region(gf_t *gf, void *src, void *dest, uint32_t val, int bytes, int xor)
|
||||
{
|
||||
#ifdef INTEL_SSSE3
|
||||
gf_internal_t *h;
|
||||
int i, j, k;
|
||||
uint32_t pp, v, *s32, *d32, *top, tmp_table[16];
|
||||
|
@ -2206,11 +2152,6 @@ gf_w32_split_4_32_lazy_sse_multiply_region(gf_t *gf, void *src, void *dest, uint
|
|||
v2 = _mm_packus_epi16(tv2, tv0);
|
||||
v3 = _mm_packus_epi16(tv3, tv1);
|
||||
|
||||
p0 = v0;
|
||||
p1 = v1;
|
||||
p2 = v2;
|
||||
p3 = v3;
|
||||
|
||||
si = _mm_and_si128(v0, mask1);
|
||||
p0 = _mm_shuffle_epi8(tables[6][0], si);
|
||||
p1 = _mm_shuffle_epi8(tables[6][1], si);
|
||||
|
@ -2281,9 +2222,8 @@ gf_w32_split_4_32_lazy_sse_multiply_region(gf_t *gf, void *src, void *dest, uint
|
|||
}
|
||||
}
|
||||
gf_do_final_region_alignment(&rd);
|
||||
|
||||
#endif
|
||||
}
|
||||
#endif
|
||||
|
||||
static
|
||||
int gf_w32_split_init(gf_t *gf)
|
||||
|
@ -2295,23 +2235,13 @@ int gf_w32_split_init(gf_t *gf)
|
|||
struct gf_split_8_32_lazy_data *d32;
|
||||
struct gf_split_16_32_lazy_data *d16;
|
||||
uint32_t p, basep;
|
||||
int i, j, exp, ispclmul, issse3;
|
||||
|
||||
ispclmul = 0;
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
ispclmul = 1;
|
||||
#endif
|
||||
|
||||
issse3 = 0;
|
||||
#ifdef INTEL_SSSE3
|
||||
issse3 = 1;
|
||||
#endif
|
||||
int i, j, exp;
|
||||
|
||||
h = (gf_internal_t *) gf->scratch;
|
||||
|
||||
/* Defaults */
|
||||
|
||||
gf->inverse.w32 = gf_w32_euclid;
|
||||
SET_FUNCTION(gf,inverse,w32,gf_w32_euclid)
|
||||
|
||||
/* JSP: First handle single multiplication:
|
||||
If args == 8, then we're doing split 8 8.
|
||||
|
@ -2320,17 +2250,19 @@ int gf_w32_split_init(gf_t *gf)
|
|||
*/
|
||||
|
||||
if (h->arg1 == 8 && h->arg2 == 8) {
|
||||
gf->multiply.w32 = gf_w32_split_8_8_multiply;
|
||||
} else if (ispclmul) {
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w32_split_8_8_multiply)
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
} else if (gf_cpu_supports_intel_pclmul) {
|
||||
if ((0xfffe0000 & h->prim_poly) == 0){
|
||||
gf->multiply.w32 = gf_w32_clm_multiply_2;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w32_clm_multiply_2)
|
||||
} else if ((0xffc00000 & h->prim_poly) == 0){
|
||||
gf->multiply.w32 = gf_w32_clm_multiply_3;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w32_clm_multiply_3)
|
||||
} else if ((0xfe000000 & h->prim_poly) == 0){
|
||||
gf->multiply.w32 = gf_w32_clm_multiply_4;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w32_clm_multiply_4)
|
||||
}
|
||||
#endif
|
||||
} else {
|
||||
gf->multiply.w32 = gf_w32_bytwo_p_multiply;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w32_bytwo_p_multiply)
|
||||
}
|
||||
|
||||
/* Easy cases: 16/32 and 2/32 */
|
||||
|
@ -2338,7 +2270,7 @@ int gf_w32_split_init(gf_t *gf)
|
|||
if ((h->arg1 == 16 && h->arg2 == 32) || (h->arg1 == 32 && h->arg2 == 16)) {
|
||||
d16 = (struct gf_split_16_32_lazy_data *) h->private;
|
||||
d16->last_value = 0;
|
||||
gf->multiply_region.w32 = gf_w32_split_16_32_lazy_multiply_region;
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_split_16_32_lazy_multiply_region)
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -2346,29 +2278,39 @@ int gf_w32_split_init(gf_t *gf)
|
|||
ld2 = (struct gf_split_2_32_lazy_data *) h->private;
|
||||
ld2->last_value = 0;
|
||||
#ifdef INTEL_SSSE3
|
||||
if (!(h->region_type & GF_REGION_NOSSE))
|
||||
gf->multiply_region.w32 = gf_w32_split_2_32_lazy_sse_multiply_region;
|
||||
else
|
||||
gf->multiply_region.w32 = gf_w32_split_2_32_lazy_multiply_region;
|
||||
#else
|
||||
gf->multiply_region.w32 = gf_w32_split_2_32_lazy_multiply_region;
|
||||
if(h->region_type & GF_REGION_SSE) return 0;
|
||||
if (gf_cpu_supports_intel_ssse3 && !(h->region_type & GF_REGION_NOSIMD)) {
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_split_2_32_lazy_sse_multiply_region)
|
||||
} else {
|
||||
#endif
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_split_2_32_lazy_multiply_region)
|
||||
if(h->region_type & GF_REGION_SIMD) return 0;
|
||||
#ifdef INTEL_SSSE3
|
||||
}
|
||||
#endif
|
||||
return 1;
|
||||
}
|
||||
|
||||
/* 4/32 or Default + SSE - There is no ALTMAP/NOSSE. */
|
||||
|
||||
|
||||
if ((h->arg1 == 4 && h->arg2 == 32) || (h->arg1 == 32 && h->arg2 == 4) ||
|
||||
(issse3 && h->mult_type == GF_REGION_DEFAULT)) {
|
||||
((gf_cpu_supports_intel_ssse3 || gf_cpu_supports_arm_neon) && h->mult_type == GF_REGION_DEFAULT)) {
|
||||
ld4 = (struct gf_split_4_32_lazy_data *) h->private;
|
||||
ld4->last_value = 0;
|
||||
if ((h->region_type & GF_REGION_NOSSE) || !issse3) {
|
||||
gf->multiply_region.w32 = gf_w32_split_4_32_lazy_multiply_region;
|
||||
if ((h->region_type & GF_REGION_NOSIMD) || !(gf_cpu_supports_intel_ssse3 || gf_cpu_supports_arm_neon)) {
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_split_4_32_lazy_multiply_region)
|
||||
} else if (gf_cpu_supports_arm_neon) {
|
||||
#ifdef ARM_NEON
|
||||
gf_w32_neon_split_init(gf);
|
||||
#endif
|
||||
} else if (h->region_type & GF_REGION_ALTMAP) {
|
||||
gf->multiply_region.w32 = gf_w32_split_4_32_lazy_sse_altmap_multiply_region;
|
||||
#ifdef INTEL_SSSE3
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_split_4_32_lazy_sse_altmap_multiply_region)
|
||||
#endif
|
||||
} else {
|
||||
gf->multiply_region.w32 = gf_w32_split_4_32_lazy_sse_multiply_region;
|
||||
#ifdef INTEL_SSSE3
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_split_4_32_lazy_sse_multiply_region)
|
||||
#endif
|
||||
}
|
||||
return 1;
|
||||
}
|
||||
|
@ -2379,7 +2321,7 @@ int gf_w32_split_init(gf_t *gf)
|
|||
h->mult_type == GF_MULT_DEFAULT) {
|
||||
d32 = (struct gf_split_8_32_lazy_data *) h->private;
|
||||
d32->last_value = 0;
|
||||
gf->multiply_region.w32 = gf_w32_split_8_32_lazy_multiply_region;
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_split_8_32_lazy_multiply_region)
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -2388,8 +2330,8 @@ int gf_w32_split_init(gf_t *gf)
|
|||
if (h->arg1 == 8 && h->arg2 == 8) {
|
||||
d8 = (struct gf_w32_split_8_8_data *) h->private;
|
||||
d8->last_value = 0;
|
||||
gf->multiply.w32 = gf_w32_split_8_8_multiply;
|
||||
gf->multiply_region.w32 = gf_w32_split_8_32_lazy_multiply_region;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w32_split_8_8_multiply)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_split_8_32_lazy_multiply_region)
|
||||
basep = 1;
|
||||
for (exp = 0; exp < 7; exp++) {
|
||||
for (j = 0; j < 256; j++) d8->tables[exp][0][j] = 0;
|
||||
|
@ -2430,7 +2372,7 @@ int gf_w32_group_init(gf_t *gf)
|
|||
uint32_t i, j, p, index;
|
||||
struct gf_w32_group_data *gd;
|
||||
gf_internal_t *h = (gf_internal_t *) gf->scratch;
|
||||
int g_r, g_s;
|
||||
uint32_t g_r, g_s;
|
||||
|
||||
g_s = h->arg1;
|
||||
g_r = h->arg2;
|
||||
|
@ -2448,7 +2390,7 @@ int gf_w32_group_init(gf_t *gf)
|
|||
gd->tshift = ((gd->tshift-1)/g_r) * g_r;
|
||||
|
||||
gd->reduce[0] = 0;
|
||||
for (i = 0; i < (1 << g_r); i++) {
|
||||
for (i = 0; i < ((uint32_t)1 << g_r); i++) {
|
||||
p = 0;
|
||||
index = 0;
|
||||
for (j = 0; j < g_r; j++) {
|
||||
|
@ -2462,14 +2404,14 @@ int gf_w32_group_init(gf_t *gf)
|
|||
}
|
||||
|
||||
if (g_s == g_r) {
|
||||
gf->multiply.w32 = gf_w32_group_s_equals_r_multiply;
|
||||
gf->multiply_region.w32 = gf_w32_group_s_equals_r_multiply_region;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w32_group_s_equals_r_multiply)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_group_s_equals_r_multiply_region)
|
||||
} else {
|
||||
gf->multiply.w32 = gf_w32_group_multiply;
|
||||
gf->multiply_region.w32 = gf_w32_group_multiply_region;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w32_group_multiply)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_group_multiply_region)
|
||||
}
|
||||
gf->divide.w32 = NULL;
|
||||
gf->inverse.w32 = gf_w32_euclid;
|
||||
SET_FUNCTION(gf,divide,w32,NULL)
|
||||
SET_FUNCTION(gf,inverse,w32,gf_w32_euclid)
|
||||
|
||||
return 1;
|
||||
}
|
||||
|
@ -2721,18 +2663,18 @@ int gf_w32_composite_init(gf_t *gf)
|
|||
cd->alog = gf_w16_get_mult_alog_table(h->base_gf);
|
||||
|
||||
if (h->region_type & GF_REGION_ALTMAP) {
|
||||
gf->multiply_region.w32 = gf_w32_composite_multiply_region_alt;
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_composite_multiply_region_alt)
|
||||
} else {
|
||||
gf->multiply_region.w32 = gf_w32_composite_multiply_region;
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_composite_multiply_region)
|
||||
}
|
||||
|
||||
if (cd->log == NULL) {
|
||||
gf->multiply.w32 = gf_w32_composite_multiply_recursive;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w32_composite_multiply_recursive)
|
||||
} else {
|
||||
gf->multiply.w32 = gf_w32_composite_multiply_inline;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w32_composite_multiply_inline)
|
||||
}
|
||||
gf->divide.w32 = NULL;
|
||||
gf->inverse.w32 = gf_w32_composite_inverse;
|
||||
SET_FUNCTION(gf,divide,w32,NULL)
|
||||
SET_FUNCTION(gf,inverse,w32,gf_w32_composite_inverse)
|
||||
|
||||
return 1;
|
||||
}
|
||||
|
@ -2741,12 +2683,6 @@ int gf_w32_composite_init(gf_t *gf)
|
|||
|
||||
int gf_w32_scratch_size(int mult_type, int region_type, int divide_type, int arg1, int arg2)
|
||||
{
|
||||
int issse3 = 0;
|
||||
|
||||
#ifdef INTEL_SSSE3
|
||||
issse3 = 1;
|
||||
#endif
|
||||
|
||||
switch(mult_type)
|
||||
{
|
||||
case GF_MULT_BYTWO_p:
|
||||
|
@ -2771,7 +2707,7 @@ int gf_w32_scratch_size(int mult_type, int region_type, int divide_type, int arg
|
|||
return sizeof(gf_internal_t) + sizeof(struct gf_split_2_32_lazy_data) + 64;
|
||||
}
|
||||
if ((arg1 == 8 && arg2 == 32) || (arg2 == 8 && arg1 == 32) ||
|
||||
(mult_type == GF_MULT_DEFAULT && !issse3)) {
|
||||
(mult_type == GF_MULT_DEFAULT && !(gf_cpu_supports_intel_ssse3 || gf_cpu_supports_arm_neon))) {
|
||||
return sizeof(gf_internal_t) + sizeof(struct gf_split_8_32_lazy_data) + 64;
|
||||
}
|
||||
if ((arg1 == 4 && arg2 == 32) ||
|
||||
|
@ -2783,7 +2719,6 @@ int gf_w32_scratch_size(int mult_type, int region_type, int divide_type, int arg
|
|||
case GF_MULT_CARRY_FREE:
|
||||
return sizeof(gf_internal_t);
|
||||
break;
|
||||
//ADAM
|
||||
case GF_MULT_CARRY_FREE_GK:
|
||||
return sizeof(gf_internal_t) + sizeof(uint64_t)*2;
|
||||
break;
|
||||
|
@ -2828,14 +2763,14 @@ int gf_w32_init(gf_t *gf)
|
|||
|
||||
if(h->mult_type != GF_MULT_COMPOSITE) h->prim_poly &= 0xffffffff;
|
||||
|
||||
gf->multiply.w32 = NULL;
|
||||
gf->divide.w32 = NULL;
|
||||
gf->inverse.w32 = NULL;
|
||||
gf->multiply_region.w32 = NULL;
|
||||
SET_FUNCTION(gf,multiply,w32,NULL)
|
||||
SET_FUNCTION(gf,divide,w32,NULL)
|
||||
SET_FUNCTION(gf,inverse,w32,NULL)
|
||||
SET_FUNCTION(gf,multiply_region,w32,NULL)
|
||||
|
||||
switch(h->mult_type) {
|
||||
case GF_MULT_CARRY_FREE: if (gf_w32_cfm_init(gf) == 0) return 0; break;
|
||||
case GF_MULT_CARRY_FREE_GK: if (gf_w32_cfmgk_init(gf) == 0) return 0; break; //ADAM
|
||||
case GF_MULT_CARRY_FREE_GK: if (gf_w32_cfmgk_init(gf) == 0) return 0; break;
|
||||
case GF_MULT_SHIFT: if (gf_w32_shift_init(gf) == 0) return 0; break;
|
||||
case GF_MULT_COMPOSITE: if (gf_w32_composite_init(gf) == 0) return 0; break;
|
||||
case GF_MULT_DEFAULT:
|
||||
|
@ -2846,30 +2781,30 @@ int gf_w32_init(gf_t *gf)
|
|||
default: return 0;
|
||||
}
|
||||
if (h->divide_type == GF_DIVIDE_EUCLID) {
|
||||
gf->divide.w32 = gf_w32_divide_from_inverse;
|
||||
gf->inverse.w32 = gf_w32_euclid;
|
||||
SET_FUNCTION(gf,divide,w32,gf_w32_divide_from_inverse)
|
||||
SET_FUNCTION(gf,inverse,w32,gf_w32_euclid)
|
||||
} else if (h->divide_type == GF_DIVIDE_MATRIX) {
|
||||
gf->divide.w32 = gf_w32_divide_from_inverse;
|
||||
gf->inverse.w32 = gf_w32_matrix;
|
||||
SET_FUNCTION(gf,divide,w32,gf_w32_divide_from_inverse)
|
||||
SET_FUNCTION(gf,inverse,w32,gf_w32_matrix)
|
||||
}
|
||||
|
||||
if (gf->inverse.w32 != NULL && gf->divide.w32 == NULL) {
|
||||
gf->divide.w32 = gf_w32_divide_from_inverse;
|
||||
SET_FUNCTION(gf,divide,w32,gf_w32_divide_from_inverse)
|
||||
}
|
||||
if (gf->inverse.w32 == NULL && gf->divide.w32 != NULL) {
|
||||
gf->inverse.w32 = gf_w32_inverse_from_divide;
|
||||
SET_FUNCTION(gf,inverse,w32,gf_w32_inverse_from_divide)
|
||||
}
|
||||
if (h->region_type == GF_REGION_CAUCHY) {
|
||||
gf->extract_word.w32 = gf_wgen_extract_word;
|
||||
gf->multiply_region.w32 = gf_wgen_cauchy_region;
|
||||
SET_FUNCTION(gf,extract_word,w32,gf_wgen_extract_word)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_wgen_cauchy_region)
|
||||
} else if (h->region_type & GF_REGION_ALTMAP) {
|
||||
if (h->mult_type == GF_MULT_COMPOSITE) {
|
||||
gf->extract_word.w32 = gf_w32_composite_extract_word;
|
||||
SET_FUNCTION(gf,extract_word,w32,gf_w32_composite_extract_word)
|
||||
} else {
|
||||
gf->extract_word.w32 = gf_w32_split_extract_word;
|
||||
SET_FUNCTION(gf,extract_word,w32,gf_w32_split_extract_word)
|
||||
}
|
||||
} else {
|
||||
gf->extract_word.w32 = gf_w32_extract_word;
|
||||
SET_FUNCTION(gf,extract_word,w32,gf_w32_extract_word)
|
||||
}
|
||||
return 1;
|
||||
}
|
||||
|
|
212
src/gf_w4.c
|
@ -11,49 +11,8 @@
|
|||
#include "gf_int.h"
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
|
||||
#define GF_FIELD_WIDTH 4
|
||||
#define GF_DOUBLE_WIDTH (GF_FIELD_WIDTH*2)
|
||||
#define GF_FIELD_SIZE (1 << GF_FIELD_WIDTH)
|
||||
#define GF_MULT_GROUP_SIZE (GF_FIELD_SIZE-1)
|
||||
|
||||
/* ------------------------------------------------------------
|
||||
JSP: Each implementation has its own data, which is allocated
|
||||
at one time as part of the handle. For that reason, it
|
||||
shouldn't be hierarchical -- i.e. one should be able to
|
||||
allocate it with one call to malloc. */
|
||||
|
||||
struct gf_logtable_data {
|
||||
uint8_t log_tbl[GF_FIELD_SIZE];
|
||||
uint8_t antilog_tbl[GF_FIELD_SIZE * 2];
|
||||
uint8_t *antilog_tbl_div;
|
||||
};
|
||||
|
||||
struct gf_single_table_data {
|
||||
uint8_t mult[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
uint8_t div[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
};
|
||||
|
||||
struct gf_double_table_data {
|
||||
uint8_t div[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
uint8_t mult[GF_FIELD_SIZE][GF_FIELD_SIZE*GF_FIELD_SIZE];
|
||||
};
|
||||
struct gf_quad_table_data {
|
||||
uint8_t div[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
uint16_t mult[GF_FIELD_SIZE][(1<<16)];
|
||||
};
|
||||
|
||||
struct gf_quad_table_lazy_data {
|
||||
uint8_t div[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
uint8_t smult[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
uint16_t mult[(1 << 16)];
|
||||
};
|
||||
|
||||
struct gf_bytwo_data {
|
||||
uint64_t prim_poly;
|
||||
uint64_t mask1;
|
||||
uint64_t mask2;
|
||||
};
|
||||
#include "gf_w4.h"
|
||||
#include "gf_cpu.h"
|
||||
|
||||
#define AB2(ip, am1 ,am2, b, t1, t2) {\
|
||||
t1 = (b << 1) & am1;\
|
||||
|
@ -176,6 +135,7 @@ gf_w4_shift_multiply (gf_t *gf, gf_val_32_t a, gf_val_32_t b)
|
|||
|
||||
/* Ben: This function works, but it is 33% slower than the normal shift mult */
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
static
|
||||
inline
|
||||
gf_val_32_t
|
||||
|
@ -183,8 +143,6 @@ gf_w4_clm_multiply (gf_t *gf, gf_val_32_t a4, gf_val_32_t b4)
|
|||
{
|
||||
gf_val_32_t rv = 0;
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
|
||||
__m128i a, b;
|
||||
__m128i result;
|
||||
__m128i prim_poly;
|
||||
|
@ -215,9 +173,9 @@ gf_w4_clm_multiply (gf_t *gf, gf_val_32_t a4, gf_val_32_t b4)
|
|||
/* Extracts 32 bit value from result. */
|
||||
|
||||
rv = ((gf_val_32_t)_mm_extract_epi32(result, 0));
|
||||
#endif
|
||||
return rv;
|
||||
}
|
||||
#endif
|
||||
|
||||
static
|
||||
void
|
||||
|
@ -353,10 +311,10 @@ int gf_w4_log_init(gf_t *gf)
|
|||
return 0;
|
||||
}
|
||||
|
||||
gf->inverse.w32 = gf_w4_inverse_from_divide;
|
||||
gf->divide.w32 = gf_w4_log_divide;
|
||||
gf->multiply.w32 = gf_w4_log_multiply;
|
||||
gf->multiply_region.w32 = gf_w4_log_multiply_region;
|
||||
SET_FUNCTION(gf,inverse,w32,gf_w4_inverse_from_divide)
|
||||
SET_FUNCTION(gf,divide,w32,gf_w4_log_divide)
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w4_log_multiply)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w4_log_multiply_region)
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -486,17 +444,22 @@ int gf_w4_single_table_init(gf_t *gf)
|
|||
}
|
||||
}
|
||||
|
||||
gf->inverse.w32 = NULL;
|
||||
gf->divide.w32 = gf_w4_single_table_divide;
|
||||
gf->multiply.w32 = gf_w4_single_table_multiply;
|
||||
#ifdef INTEL_SSSE3
|
||||
if(h->region_type & (GF_REGION_NOSSE | GF_REGION_CAUCHY))
|
||||
gf->multiply_region.w32 = gf_w4_single_table_multiply_region;
|
||||
else
|
||||
gf->multiply_region.w32 = gf_w4_single_table_sse_multiply_region;
|
||||
#else
|
||||
gf->multiply_region.w32 = gf_w4_single_table_multiply_region;
|
||||
if (h->region_type & GF_REGION_SSE) return 0;
|
||||
SET_FUNCTION(gf,inverse,w32,NULL)
|
||||
SET_FUNCTION(gf,divide,w32,gf_w4_single_table_divide)
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w4_single_table_multiply)
|
||||
#if defined(INTEL_SSSE3)
|
||||
if (gf_cpu_supports_intel_ssse3 && !(h->region_type & (GF_REGION_NOSIMD | GF_REGION_CAUCHY))) {
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w4_single_table_sse_multiply_region)
|
||||
} else {
|
||||
#elif defined(ARM_NEON)
|
||||
if (gf_cpu_supports_arm_neon && !(h->region_type & (GF_REGION_NOSIMD | GF_REGION_CAUCHY))) {
|
||||
gf_w4_neon_single_table_init(gf);
|
||||
} else {
|
||||
#endif
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w4_single_table_multiply_region)
|
||||
if (h->region_type & GF_REGION_SIMD) return 0;
|
||||
#if defined(INTEL_SSSE3) || defined(ARM_NEON)
|
||||
}
|
||||
#endif
|
||||
|
||||
return 1;
|
||||
|
@ -586,10 +549,10 @@ int gf_w4_double_table_init(gf_t *gf)
|
|||
}
|
||||
}
|
||||
|
||||
gf->inverse.w32 = NULL;
|
||||
gf->divide.w32 = gf_w4_double_table_divide;
|
||||
gf->multiply.w32 = gf_w4_double_table_multiply;
|
||||
gf->multiply_region.w32 = gf_w4_double_table_multiply_region;
|
||||
SET_FUNCTION(gf,inverse,w32,NULL)
|
||||
SET_FUNCTION(gf,divide,w32,gf_w4_double_table_divide)
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w4_double_table_multiply)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w4_double_table_multiply_region)
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -720,10 +683,10 @@ int gf_w4_quad_table_init(gf_t *gf)
|
|||
}
|
||||
}
|
||||
|
||||
gf->inverse.w32 = NULL;
|
||||
gf->divide.w32 = gf_w4_quad_table_divide;
|
||||
gf->multiply.w32 = gf_w4_quad_table_multiply;
|
||||
gf->multiply_region.w32 = gf_w4_quad_table_multiply_region;
|
||||
SET_FUNCTION(gf,inverse,w32,NULL)
|
||||
SET_FUNCTION(gf,divide,w32,gf_w4_quad_table_divide)
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w4_quad_table_multiply)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w4_quad_table_multiply_region)
|
||||
return 1;
|
||||
}
|
||||
static
|
||||
|
@ -762,10 +725,10 @@ int gf_w4_quad_table_lazy_init(gf_t *gf)
|
|||
}
|
||||
}
|
||||
|
||||
gf->inverse.w32 = NULL;
|
||||
gf->divide.w32 = gf_w4_quad_table_lazy_divide;
|
||||
gf->multiply.w32 = gf_w4_quad_table_lazy_multiply;
|
||||
gf->multiply_region.w32 = gf_w4_quad_table_multiply_region;
|
||||
SET_FUNCTION(gf,inverse,w32,NULL)
|
||||
SET_FUNCTION(gf,divide,w32,gf_w4_quad_table_lazy_divide)
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w4_quad_table_lazy_multiply)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w4_quad_table_multiply_region)
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -774,16 +737,13 @@ int gf_w4_table_init(gf_t *gf)
|
|||
{
|
||||
int rt;
|
||||
gf_internal_t *h;
|
||||
int issse3 = 0;
|
||||
|
||||
#ifdef INTEL_SSSE3
|
||||
issse3 = 1;
|
||||
#endif
|
||||
|
||||
h = (gf_internal_t *) gf->scratch;
|
||||
rt = (h->region_type);
|
||||
|
||||
if (h->mult_type == GF_MULT_DEFAULT && !issse3) rt |= GF_REGION_DOUBLE_TABLE;
|
||||
if (h->mult_type == GF_MULT_DEFAULT &&
|
||||
!(gf_cpu_supports_intel_ssse3 || gf_cpu_supports_arm_neon))
|
||||
rt |= GF_REGION_DOUBLE_TABLE;
|
||||
|
||||
if (rt & GF_REGION_DOUBLE_TABLE) {
|
||||
return gf_w4_double_table_init(gf);
|
||||
|
@ -967,11 +927,11 @@ gf_w4_bytwo_p_sse_multiply_region(gf_t *gf, void *src, void *dest, gf_val_32_t v
|
|||
#endif
|
||||
|
||||
/*
|
||||
#ifdef INTEL_SSE2
|
||||
static
|
||||
void
|
||||
gf_w4_bytwo_b_sse_multiply_region(gf_t *gf, void *src, void *dest, gf_val_32_t val, int bytes, int xor)
|
||||
{
|
||||
#ifdef INTEL_SSE2
|
||||
uint8_t *d8, *s8, tb;
|
||||
__m128i pp, m1, m2, t1, t2, va, vb;
|
||||
struct gf_bytwo_data *btd;
|
||||
|
@ -1028,8 +988,8 @@ gf_w4_bytwo_b_sse_multiply_region(gf_t *gf, void *src, void *dest, gf_val_32_t v
|
|||
}
|
||||
}
|
||||
gf_do_final_region_alignment(&rd);
|
||||
#endif
|
||||
}
|
||||
#endif
|
||||
*/
|
||||
|
||||
#ifdef INTEL_SSE2
|
||||
|
@ -1903,28 +1863,30 @@ int gf_w4_bytwo_init(gf_t *gf)
|
|||
}
|
||||
|
||||
if (h->mult_type == GF_MULT_BYTWO_p) {
|
||||
gf->multiply.w32 = gf_w4_bytwo_p_multiply;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w4_bytwo_p_multiply)
|
||||
#ifdef INTEL_SSE2
|
||||
if (h->region_type & GF_REGION_NOSSE)
|
||||
gf->multiply_region.w32 = gf_w4_bytwo_p_nosse_multiply_region;
|
||||
else
|
||||
gf->multiply_region.w32 = gf_w4_bytwo_p_sse_multiply_region;
|
||||
#else
|
||||
gf->multiply_region.w32 = gf_w4_bytwo_p_nosse_multiply_region;
|
||||
if (h->region_type & GF_REGION_SSE)
|
||||
return 0;
|
||||
if (gf_cpu_supports_intel_sse2 && !(h->region_type & GF_REGION_NOSIMD)) {
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w4_bytwo_p_sse_multiply_region)
|
||||
} else {
|
||||
#endif
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w4_bytwo_p_nosse_multiply_region)
|
||||
if (h->region_type & GF_REGION_SIMD)
|
||||
return 0;
|
||||
#ifdef INTEL_SSE2
|
||||
}
|
||||
#endif
|
||||
} else {
|
||||
gf->multiply.w32 = gf_w4_bytwo_b_multiply;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w4_bytwo_b_multiply)
|
||||
#ifdef INTEL_SSE2
|
||||
if (h->region_type & GF_REGION_NOSSE)
|
||||
gf->multiply_region.w32 = gf_w4_bytwo_b_nosse_multiply_region;
|
||||
else
|
||||
gf->multiply_region.w32 = gf_w4_bytwo_b_sse_multiply_region;
|
||||
#else
|
||||
gf->multiply_region.w32 = gf_w4_bytwo_b_nosse_multiply_region;
|
||||
if (h->region_type & GF_REGION_SSE)
|
||||
return 0;
|
||||
if (gf_cpu_supports_intel_sse2 && !(h->region_type & GF_REGION_NOSIMD)) {
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w4_bytwo_b_sse_multiply_region)
|
||||
} else {
|
||||
#endif
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w4_bytwo_b_nosse_multiply_region)
|
||||
if (h->region_type & GF_REGION_SIMD)
|
||||
return 0;
|
||||
#ifdef INTEL_SSE2
|
||||
}
|
||||
#endif
|
||||
}
|
||||
return 1;
|
||||
|
@ -1935,8 +1897,14 @@ static
|
|||
int gf_w4_cfm_init(gf_t *gf)
|
||||
{
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
gf->multiply.w32 = gf_w4_clm_multiply;
|
||||
return 1;
|
||||
if (gf_cpu_supports_intel_pclmul) {
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w4_clm_multiply)
|
||||
return 1;
|
||||
}
|
||||
#elif defined(ARM_NEON)
|
||||
if (gf_cpu_supports_arm_neon) {
|
||||
return gf_w4_neon_cfm_init(gf);
|
||||
}
|
||||
#endif
|
||||
return 0;
|
||||
}
|
||||
|
@ -1944,7 +1912,7 @@ int gf_w4_cfm_init(gf_t *gf)
|
|||
static
|
||||
int gf_w4_shift_init(gf_t *gf)
|
||||
{
|
||||
gf->multiply.w32 = gf_w4_shift_multiply;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w4_shift_multiply)
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -1953,12 +1921,6 @@ int gf_w4_shift_init(gf_t *gf)
|
|||
|
||||
int gf_w4_scratch_size(int mult_type, int region_type, int divide_type, int arg1, int arg2)
|
||||
{
|
||||
int issse3 = 0;
|
||||
|
||||
#ifdef INTEL_SSSE3
|
||||
issse3 = 1;
|
||||
#endif
|
||||
|
||||
switch(mult_type)
|
||||
{
|
||||
case GF_MULT_BYTWO_p:
|
||||
|
@ -1971,7 +1933,9 @@ int gf_w4_scratch_size(int mult_type, int region_type, int divide_type, int arg1
|
|||
return sizeof(gf_internal_t) + sizeof(struct gf_single_table_data) + 64;
|
||||
}
|
||||
|
||||
if (mult_type == GF_MULT_DEFAULT && !issse3) region_type = GF_REGION_DOUBLE_TABLE;
|
||||
if (mult_type == GF_MULT_DEFAULT &&
|
||||
!(gf_cpu_supports_arm_neon || gf_cpu_supports_intel_ssse3))
|
||||
region_type = GF_REGION_DOUBLE_TABLE;
|
||||
|
||||
if (region_type & GF_REGION_DOUBLE_TABLE) {
|
||||
return sizeof(gf_internal_t) + sizeof(struct gf_double_table_data) + 64;
|
||||
|
@ -2009,11 +1973,11 @@ gf_w4_init (gf_t *gf)
|
|||
h = (gf_internal_t *) gf->scratch;
|
||||
if (h->prim_poly == 0) h->prim_poly = 0x13;
|
||||
h->prim_poly |= 0x10;
|
||||
gf->multiply.w32 = NULL;
|
||||
gf->divide.w32 = NULL;
|
||||
gf->inverse.w32 = NULL;
|
||||
gf->multiply_region.w32 = NULL;
|
||||
gf->extract_word.w32 = gf_w4_extract_word;
|
||||
SET_FUNCTION(gf,multiply,w32,NULL)
|
||||
SET_FUNCTION(gf,divide,w32,NULL)
|
||||
SET_FUNCTION(gf,inverse,w32,NULL)
|
||||
SET_FUNCTION(gf,multiply_region,w32,NULL)
|
||||
SET_FUNCTION(gf,extract_word,w32,gf_w4_extract_word)
|
||||
|
||||
switch(h->mult_type) {
|
||||
case GF_MULT_CARRY_FREE: if (gf_w4_cfm_init(gf) == 0) return 0; break;
|
||||
|
@ -2027,27 +1991,27 @@ gf_w4_init (gf_t *gf)
|
|||
}
|
||||
|
||||
if (h->divide_type == GF_DIVIDE_EUCLID) {
|
||||
gf->divide.w32 = gf_w4_divide_from_inverse;
|
||||
gf->inverse.w32 = gf_w4_euclid;
|
||||
SET_FUNCTION(gf,divide,w32,gf_w4_divide_from_inverse)
|
||||
SET_FUNCTION(gf,inverse,w32,gf_w4_euclid)
|
||||
} else if (h->divide_type == GF_DIVIDE_MATRIX) {
|
||||
gf->divide.w32 = gf_w4_divide_from_inverse;
|
||||
gf->inverse.w32 = gf_w4_matrix;
|
||||
SET_FUNCTION(gf,divide,w32,gf_w4_divide_from_inverse)
|
||||
SET_FUNCTION(gf,inverse,w32,gf_w4_matrix)
|
||||
}
|
||||
|
||||
if (gf->divide.w32 == NULL) {
|
||||
gf->divide.w32 = gf_w4_divide_from_inverse;
|
||||
if (gf->inverse.w32 == NULL) gf->inverse.w32 = gf_w4_euclid;
|
||||
SET_FUNCTION(gf,divide,w32,gf_w4_divide_from_inverse)
|
||||
if (gf->inverse.w32 == NULL) SET_FUNCTION(gf,inverse,w32,gf_w4_euclid)
|
||||
}
|
||||
|
||||
if (gf->inverse.w32 == NULL) gf->inverse.w32 = gf_w4_inverse_from_divide;
|
||||
if (gf->inverse.w32 == NULL) SET_FUNCTION(gf,inverse,w32,gf_w4_inverse_from_divide)
|
||||
|
||||
if (h->region_type == GF_REGION_CAUCHY) {
|
||||
gf->multiply_region.w32 = gf_wgen_cauchy_region;
|
||||
gf->extract_word.w32 = gf_wgen_extract_word;
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_wgen_cauchy_region)
|
||||
SET_FUNCTION(gf,extract_word,w32,gf_wgen_extract_word)
|
||||
}
|
||||
|
||||
if (gf->multiply_region.w32 == NULL) {
|
||||
gf->multiply_region.w32 = gf_w4_multiply_region_from_single;
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w4_multiply_region_from_single)
|
||||
}
|
||||
|
||||
return 1;
|
||||
|
|
315
src/gf_w64.c
|
@ -11,38 +11,8 @@
|
|||
#include "gf_int.h"
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
|
||||
#define GF_FIELD_WIDTH (64)
|
||||
#define GF_FIRST_BIT (1ULL << 63)
|
||||
|
||||
#define GF_BASE_FIELD_WIDTH (32)
|
||||
#define GF_BASE_FIELD_SIZE (1ULL << GF_BASE_FIELD_WIDTH)
|
||||
#define GF_BASE_FIELD_GROUP_SIZE GF_BASE_FIELD_SIZE-1
|
||||
|
||||
struct gf_w64_group_data {
|
||||
uint64_t *reduce;
|
||||
uint64_t *shift;
|
||||
uint64_t *memory;
|
||||
};
|
||||
|
||||
struct gf_split_4_64_lazy_data {
|
||||
uint64_t tables[16][16];
|
||||
uint64_t last_value;
|
||||
};
|
||||
|
||||
struct gf_split_8_64_lazy_data {
|
||||
uint64_t tables[8][(1<<8)];
|
||||
uint64_t last_value;
|
||||
};
|
||||
|
||||
struct gf_split_16_64_lazy_data {
|
||||
uint64_t tables[4][(1<<16)];
|
||||
uint64_t last_value;
|
||||
};
|
||||
|
||||
struct gf_split_8_8_data {
|
||||
uint64_t tables[15][256][256];
|
||||
};
|
||||
#include "gf_w64.h"
|
||||
#include "gf_cpu.h"
|
||||
|
||||
static
|
||||
inline
|
||||
|
@ -66,7 +36,7 @@ void
|
|||
gf_w64_multiply_region_from_single(gf_t *gf, void *src, void *dest, gf_val_64_t val, int bytes, int
|
||||
xor)
|
||||
{
|
||||
int i;
|
||||
uint32_t i;
|
||||
gf_val_64_t *s64;
|
||||
gf_val_64_t *d64;
|
||||
|
||||
|
@ -100,7 +70,7 @@ xor)
|
|||
__m128i result, r1;
|
||||
__m128i prim_poly;
|
||||
__m128i w;
|
||||
__m128i m1, m2, m3, m4;
|
||||
__m128i m1, m3, m4;
|
||||
gf_internal_t * h = gf->scratch;
|
||||
|
||||
if (val == 0) { gf_multby_zero(dest, bytes, xor); return; }
|
||||
|
@ -112,8 +82,6 @@ xor)
|
|||
prim_poly = _mm_set_epi32(0, 0, 0, (uint32_t)(h->prim_poly & 0xffffffffULL));
|
||||
b = _mm_insert_epi64 (_mm_setzero_si128(), val, 0);
|
||||
m1 = _mm_set_epi32(0, 0, 0, (uint32_t)0xffffffff);
|
||||
m2 = _mm_slli_si128(m1, 4);
|
||||
m2 = _mm_or_si128(m1, m2);
|
||||
m3 = _mm_slli_si128(m1, 8);
|
||||
m4 = _mm_slli_si128(m3, 4);
|
||||
|
||||
|
@ -321,12 +289,9 @@ gf_w64_shift_multiply (gf_t *gf, gf_val_64_t a64, gf_val_64_t b64)
|
|||
gf_internal_t *h;
|
||||
|
||||
h = (gf_internal_t *) gf->scratch;
|
||||
ppr = h->prim_poly;
|
||||
|
||||
/* Allen: set leading one of primitive polynomial */
|
||||
|
||||
ppl = 1;
|
||||
|
||||
a = a64;
|
||||
bl = 0;
|
||||
br = b64;
|
||||
|
@ -374,6 +339,8 @@ gf_w64_shift_multiply (gf_t *gf, gf_val_64_t a64, gf_val_64_t b64)
|
|||
* ELM: Use the Intel carryless multiply instruction to do very fast 64x64 multiply.
|
||||
*/
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
|
||||
static
|
||||
inline
|
||||
gf_val_64_t
|
||||
|
@ -381,8 +348,6 @@ gf_w64_clm_multiply_2 (gf_t *gf, gf_val_64_t a64, gf_val_64_t b64)
|
|||
{
|
||||
gf_val_64_t rv = 0;
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
|
||||
__m128i a, b;
|
||||
__m128i result;
|
||||
__m128i prim_poly;
|
||||
|
@ -412,10 +377,12 @@ gf_w64_clm_multiply_2 (gf_t *gf, gf_val_64_t a64, gf_val_64_t b64)
|
|||
result = _mm_xor_si128 (result, w);
|
||||
|
||||
rv = ((gf_val_64_t)_mm_extract_epi64(result, 0));
|
||||
#endif
|
||||
return rv;
|
||||
}
|
||||
#endif
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
|
||||
static
|
||||
inline
|
||||
gf_val_64_t
|
||||
|
@ -423,8 +390,6 @@ gf_w64_clm_multiply_4 (gf_t *gf, gf_val_64_t a64, gf_val_64_t b64)
|
|||
{
|
||||
gf_val_64_t rv = 0;
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
|
||||
__m128i a, b;
|
||||
__m128i result;
|
||||
__m128i prim_poly;
|
||||
|
@ -454,15 +419,15 @@ gf_w64_clm_multiply_4 (gf_t *gf, gf_val_64_t a64, gf_val_64_t b64)
|
|||
result = _mm_xor_si128 (result, w);
|
||||
|
||||
rv = ((gf_val_64_t)_mm_extract_epi64(result, 0));
|
||||
#endif
|
||||
return rv;
|
||||
}
|
||||
#endif
|
||||
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
void
|
||||
gf_w64_clm_multiply_region(gf_t *gf, void *src, void *dest, uint64_t val, int bytes, int xor)
|
||||
{
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
gf_internal_t *h;
|
||||
uint8_t *s8, *d8, *dtop;
|
||||
gf_region_data rd;
|
||||
|
@ -540,8 +505,8 @@ gf_w64_clm_multiply_region(gf_t *gf, void *src, void *dest, uint64_t val, int by
|
|||
}
|
||||
}
|
||||
gf_do_final_region_alignment(&rd);
|
||||
#endif
|
||||
}
|
||||
#endif
|
||||
|
||||
void
|
||||
gf_w64_split_4_64_lazy_multiply_region(gf_t *gf, void *src, void *dest, uint64_t val, int bytes, int xor)
|
||||
|
@ -733,33 +698,35 @@ gf_w64_split_16_64_lazy_multiply_region(gf_t *gf, void *src, void *dest, uint64_
|
|||
static
|
||||
int gf_w64_shift_init(gf_t *gf)
|
||||
{
|
||||
gf->multiply.w64 = gf_w64_shift_multiply;
|
||||
gf->inverse.w64 = gf_w64_euclid;
|
||||
gf->multiply_region.w64 = gf_w64_multiply_region_from_single;
|
||||
SET_FUNCTION(gf,multiply,w64,gf_w64_shift_multiply)
|
||||
SET_FUNCTION(gf,inverse,w64,gf_w64_euclid)
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_multiply_region_from_single)
|
||||
return 1;
|
||||
}
|
||||
|
||||
static
|
||||
int gf_w64_cfm_init(gf_t *gf)
|
||||
{
|
||||
gf->inverse.w64 = gf_w64_euclid;
|
||||
gf->multiply_region.w64 = gf_w64_multiply_region_from_single;
|
||||
SET_FUNCTION(gf,inverse,w64,gf_w64_euclid)
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_multiply_region_from_single)
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
gf_internal_t *h;
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
if (gf_cpu_supports_intel_pclmul) {
|
||||
gf_internal_t *h;
|
||||
|
||||
h = (gf_internal_t *) gf->scratch;
|
||||
h = (gf_internal_t *) gf->scratch;
|
||||
|
||||
if ((0xfffffffe00000000ULL & h->prim_poly) == 0){
|
||||
gf->multiply.w64 = gf_w64_clm_multiply_2;
|
||||
gf->multiply_region.w64 = gf_w64_clm_multiply_region_from_single_2;
|
||||
}else if((0xfffe000000000000ULL & h->prim_poly) == 0){
|
||||
gf->multiply.w64 = gf_w64_clm_multiply_4;
|
||||
gf->multiply_region.w64 = gf_w64_clm_multiply_region_from_single_4;
|
||||
} else {
|
||||
return 0;
|
||||
if ((0xfffffffe00000000ULL & h->prim_poly) == 0){
|
||||
SET_FUNCTION(gf,multiply,w64,gf_w64_clm_multiply_2)
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_clm_multiply_region_from_single_2)
|
||||
}else if((0xfffe000000000000ULL & h->prim_poly) == 0){
|
||||
SET_FUNCTION(gf,multiply,w64,gf_w64_clm_multiply_4)
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_clm_multiply_region_from_single_4)
|
||||
} else {
|
||||
return 0;
|
||||
}
|
||||
return 1;
|
||||
}
|
||||
return 1;
|
||||
#endif
|
||||
|
||||
return 0;
|
||||
|
@ -769,7 +736,7 @@ static
|
|||
void
|
||||
gf_w64_group_set_shift_tables(uint64_t *shift, uint64_t val, gf_internal_t *h)
|
||||
{
|
||||
int i;
|
||||
uint64_t i;
|
||||
uint64_t j;
|
||||
uint64_t one = 1;
|
||||
int g_s;
|
||||
|
@ -777,7 +744,7 @@ gf_w64_group_set_shift_tables(uint64_t *shift, uint64_t val, gf_internal_t *h)
|
|||
g_s = h->arg1;
|
||||
shift[0] = 0;
|
||||
|
||||
for (i = 1; i < (1 << g_s); i <<= 1) {
|
||||
for (i = 1; i < ((uint64_t)1 << g_s); i <<= 1) {
|
||||
for (j = 0; j < i; j++) shift[i|j] = shift[j]^val;
|
||||
if (val & (one << 63)) {
|
||||
val <<= 1;
|
||||
|
@ -803,7 +770,7 @@ gf_w64_group_multiply(gf_t *gf, gf_val_64_t a, gf_val_64_t b)
|
|||
gd = (struct gf_w64_group_data *) h->private;
|
||||
gf_w64_group_set_shift_tables(gd->shift, b, h);
|
||||
|
||||
mask = ((1 << g_s) - 1);
|
||||
mask = (((uint64_t)1 << g_s) - 1);
|
||||
top = 0;
|
||||
bot = gd->shift[a&mask];
|
||||
a >>= g_s;
|
||||
|
@ -827,7 +794,7 @@ gf_w64_group_multiply(gf_t *gf, gf_val_64_t a, gf_val_64_t b)
|
|||
|
||||
lshift = ((lshift-1) / g_r) * g_r;
|
||||
rshift = 64 - lshift;
|
||||
mask = (1 << g_r) - 1;
|
||||
mask = ((uint64_t)1 << g_r) - 1;
|
||||
while (lshift >= 0) {
|
||||
tp = gd->reduce[(top >> lshift) & mask];
|
||||
top ^= (tp >> rshift);
|
||||
|
@ -876,8 +843,8 @@ void gf_w64_group_multiply_region(gf_t *gf, void *src, void *dest, gf_val_64_t v
|
|||
d64 = (uint64_t *) rd.d_start;
|
||||
dtop = (uint64_t *) rd.d_top;
|
||||
|
||||
smask = (1 << g_s) - 1;
|
||||
rmask = (1 << g_r) - 1;
|
||||
smask = ((uint64_t)1 << g_s) - 1;
|
||||
rmask = ((uint64_t)1 << g_r) - 1;
|
||||
|
||||
while (d64 < dtop) {
|
||||
a64 = *s64;
|
||||
|
@ -1020,7 +987,7 @@ int gf_w64_group_init(gf_t *gf)
|
|||
uint64_t i, j, p, index;
|
||||
struct gf_w64_group_data *gd;
|
||||
gf_internal_t *h = (gf_internal_t *) gf->scratch;
|
||||
int g_r, g_s;
|
||||
uint64_t g_r, g_s;
|
||||
|
||||
g_s = h->arg1;
|
||||
g_r = h->arg2;
|
||||
|
@ -1030,7 +997,7 @@ int gf_w64_group_init(gf_t *gf)
|
|||
gd->reduce = gd->shift + (1 << g_s);
|
||||
|
||||
gd->reduce[0] = 0;
|
||||
for (i = 0; i < (1 << g_r); i++) {
|
||||
for (i = 0; i < ((uint64_t)1 << g_r); i++) {
|
||||
p = 0;
|
||||
index = 0;
|
||||
for (j = 0; j < g_r; j++) {
|
||||
|
@ -1044,14 +1011,14 @@ int gf_w64_group_init(gf_t *gf)
|
|||
}
|
||||
|
||||
if (g_s == g_r) {
|
||||
gf->multiply.w64 = gf_w64_group_s_equals_r_multiply;
|
||||
gf->multiply_region.w64 = gf_w64_group_s_equals_r_multiply_region;
|
||||
SET_FUNCTION(gf,multiply,w64,gf_w64_group_s_equals_r_multiply)
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_group_s_equals_r_multiply_region)
|
||||
} else {
|
||||
gf->multiply.w64 = gf_w64_group_multiply;
|
||||
gf->multiply_region.w64 = gf_w64_group_multiply_region;
|
||||
SET_FUNCTION(gf,multiply,w64,gf_w64_group_multiply)
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_group_multiply_region)
|
||||
}
|
||||
gf->divide.w64 = NULL;
|
||||
gf->inverse.w64 = gf_w64_euclid;
|
||||
SET_FUNCTION(gf,divide,w64,NULL)
|
||||
SET_FUNCTION(gf,inverse,w64,gf_w64_euclid)
|
||||
|
||||
return 1;
|
||||
}
|
||||
|
@ -1297,9 +1264,9 @@ gf_w64_bytwo_b_nosse_multiply_region(gf_t *gf, void *src, void *dest, gf_val_64_
|
|||
v = _mm_srli_epi64(v, 1); }
|
||||
|
||||
|
||||
#ifdef INTEL_SSE2
|
||||
void gf_w64_bytwo_p_sse_multiply_region(gf_t *gf, void *src, void *dest, gf_val_64_t val, int bytes, int xor)
|
||||
{
|
||||
#ifdef INTEL_SSE2
|
||||
int i;
|
||||
uint8_t *s8, *d8;
|
||||
uint64_t vrev, one64;
|
||||
|
@ -1358,8 +1325,8 @@ void gf_w64_bytwo_p_sse_multiply_region(gf_t *gf, void *src, void *dest, gf_val_
|
|||
s8 += 16;
|
||||
}
|
||||
gf_do_final_region_alignment(&rd);
|
||||
#endif
|
||||
}
|
||||
#endif
|
||||
|
||||
#ifdef INTEL_SSE2
|
||||
static
|
||||
|
@ -1491,31 +1458,33 @@ int gf_w64_bytwo_init(gf_t *gf)
|
|||
h = (gf_internal_t *) gf->scratch;
|
||||
|
||||
if (h->mult_type == GF_MULT_BYTWO_p) {
|
||||
gf->multiply.w64 = gf_w64_bytwo_p_multiply;
|
||||
SET_FUNCTION(gf,multiply,w64,gf_w64_bytwo_p_multiply)
|
||||
#ifdef INTEL_SSE2
|
||||
if (h->region_type & GF_REGION_NOSSE)
|
||||
gf->multiply_region.w64 = gf_w64_bytwo_p_nosse_multiply_region;
|
||||
else
|
||||
gf->multiply_region.w64 = gf_w64_bytwo_p_sse_multiply_region;
|
||||
#else
|
||||
gf->multiply_region.w64 = gf_w64_bytwo_p_nosse_multiply_region;
|
||||
if(h->region_type & GF_REGION_SSE)
|
||||
return 0;
|
||||
if (gf_cpu_supports_intel_sse2 && !(h->region_type & GF_REGION_NOSIMD)) {
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_bytwo_p_sse_multiply_region)
|
||||
} else {
|
||||
#endif
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_bytwo_p_nosse_multiply_region)
|
||||
if(h->region_type & GF_REGION_SIMD)
|
||||
return 0;
|
||||
#ifdef INTEL_SSE2
|
||||
}
|
||||
#endif
|
||||
} else {
|
||||
gf->multiply.w64 = gf_w64_bytwo_b_multiply;
|
||||
SET_FUNCTION(gf,multiply,w64,gf_w64_bytwo_b_multiply)
|
||||
#ifdef INTEL_SSE2
|
||||
if (h->region_type & GF_REGION_NOSSE)
|
||||
gf->multiply_region.w64 = gf_w64_bytwo_b_nosse_multiply_region;
|
||||
else
|
||||
gf->multiply_region.w64 = gf_w64_bytwo_b_sse_multiply_region;
|
||||
#else
|
||||
gf->multiply_region.w64 = gf_w64_bytwo_b_nosse_multiply_region;
|
||||
if(h->region_type & GF_REGION_SSE)
|
||||
if (gf_cpu_supports_intel_sse2 && !(h->region_type & GF_REGION_NOSIMD)) {
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_bytwo_b_sse_multiply_region)
|
||||
} else {
|
||||
#endif
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_bytwo_b_nosse_multiply_region)
|
||||
if(h->region_type & GF_REGION_SIMD)
|
||||
return 0;
|
||||
#ifdef INTEL_SSE2
|
||||
}
|
||||
#endif
|
||||
}
|
||||
gf->inverse.w64 = gf_w64_euclid;
|
||||
SET_FUNCTION(gf,inverse,w64,gf_w64_euclid)
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -1689,14 +1658,14 @@ int gf_w64_composite_init(gf_t *gf)
|
|||
gf_internal_t *h = (gf_internal_t *) gf->scratch;
|
||||
|
||||
if (h->region_type & GF_REGION_ALTMAP) {
|
||||
gf->multiply_region.w64 = gf_w64_composite_multiply_region_alt;
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_composite_multiply_region_alt)
|
||||
} else {
|
||||
gf->multiply_region.w64 = gf_w64_composite_multiply_region;
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_composite_multiply_region)
|
||||
}
|
||||
|
||||
gf->multiply.w64 = gf_w64_composite_multiply;
|
||||
gf->divide.w64 = NULL;
|
||||
gf->inverse.w64 = gf_w64_composite_inverse;
|
||||
SET_FUNCTION(gf,multiply,w64,gf_w64_composite_multiply)
|
||||
SET_FUNCTION(gf,divide,w64,NULL)
|
||||
SET_FUNCTION(gf,inverse,w64,gf_w64_composite_inverse)
|
||||
|
||||
return 1;
|
||||
}
|
||||
|
@ -2006,86 +1975,109 @@ int gf_w64_split_init(gf_t *gf)
|
|||
|
||||
/* Defaults */
|
||||
|
||||
gf->multiply_region.w64 = gf_w64_multiply_region_from_single;
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_multiply_region_from_single)
|
||||
|
||||
gf->multiply.w64 = gf_w64_bytwo_p_multiply;
|
||||
SET_FUNCTION(gf,multiply,w64,gf_w64_bytwo_p_multiply)
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
if ((!(h->region_type & GF_REGION_NOSSE) &&
|
||||
(h->arg1 == 64 || h->arg2 == 64)) ||
|
||||
h->mult_type == GF_MULT_DEFAULT){
|
||||
|
||||
if ((0xfffffffe00000000ULL & h->prim_poly) == 0){
|
||||
gf->multiply.w64 = gf_w64_clm_multiply_2;
|
||||
gf->multiply_region.w64 = gf_w64_clm_multiply_region_from_single_2;
|
||||
}else if((0xfffe000000000000ULL & h->prim_poly) == 0){
|
||||
gf->multiply.w64 = gf_w64_clm_multiply_4;
|
||||
gf->multiply_region.w64 = gf_w64_clm_multiply_region_from_single_4;
|
||||
}else{
|
||||
return 0;
|
||||
if (gf_cpu_supports_intel_pclmul) {
|
||||
if ((!(h->region_type & GF_REGION_NOSIMD) &&
|
||||
(h->arg1 == 64 || h->arg2 == 64)) ||
|
||||
h->mult_type == GF_MULT_DEFAULT){
|
||||
|
||||
if ((0xfffffffe00000000ULL & h->prim_poly) == 0){
|
||||
SET_FUNCTION(gf,multiply,w64,gf_w64_clm_multiply_2)
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_clm_multiply_region_from_single_2)
|
||||
}else if((0xfffe000000000000ULL & h->prim_poly) == 0){
|
||||
SET_FUNCTION(gf,multiply,w64,gf_w64_clm_multiply_4)
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_clm_multiply_region_from_single_4)
|
||||
}else{
|
||||
return 0;
|
||||
}
|
||||
}
|
||||
}
|
||||
#endif
|
||||
|
||||
gf->inverse.w64 = gf_w64_euclid;
|
||||
SET_FUNCTION(gf,inverse,w64,gf_w64_euclid)
|
||||
|
||||
/* Allen: set region pointers for default mult type. Single pointers are
|
||||
* taken care of above (explicitly for sse, implicitly for no sse). */
|
||||
|
||||
#ifdef INTEL_SSE4
|
||||
if (h->mult_type == GF_MULT_DEFAULT) {
|
||||
d4 = (struct gf_split_4_64_lazy_data *) h->private;
|
||||
d4->last_value = 0;
|
||||
gf->multiply_region.w64 = gf_w64_split_4_64_lazy_sse_multiply_region;
|
||||
}
|
||||
#else
|
||||
if (h->mult_type == GF_MULT_DEFAULT) {
|
||||
d8 = (struct gf_split_8_64_lazy_data *) h->private;
|
||||
d8->last_value = 0;
|
||||
gf->multiply_region.w64 = gf_w64_split_8_64_lazy_multiply_region;
|
||||
}
|
||||
#if defined(INTEL_SSE4) || defined(ARCH_AARCH64)
|
||||
if (gf_cpu_supports_intel_sse4 || gf_cpu_supports_arm_neon) {
|
||||
d4 = (struct gf_split_4_64_lazy_data *) h->private;
|
||||
d4->last_value = 0;
|
||||
#if defined(INTEL_SSE4)
|
||||
if (gf_cpu_supports_intel_sse4)
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_split_4_64_lazy_sse_multiply_region)
|
||||
#elif defined(ARCH_AARCH64)
|
||||
if (gf_cpu_supports_arm_neon)
|
||||
gf_w64_neon_split_init(gf);
|
||||
#endif
|
||||
} else {
|
||||
#endif
|
||||
d8 = (struct gf_split_8_64_lazy_data *) h->private;
|
||||
d8->last_value = 0;
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_split_8_64_lazy_multiply_region)
|
||||
#if defined(INTEL_SSE4) || defined(ARCH_AARCH64)
|
||||
}
|
||||
#endif
|
||||
}
|
||||
|
||||
if ((h->arg1 == 4 && h->arg2 == 64) || (h->arg1 == 64 && h->arg2 == 4)) {
|
||||
d4 = (struct gf_split_4_64_lazy_data *) h->private;
|
||||
d4->last_value = 0;
|
||||
|
||||
if((h->region_type & GF_REGION_ALTMAP) && (h->region_type & GF_REGION_NOSSE)) return 0;
|
||||
if((h->region_type & GF_REGION_ALTMAP) && (h->region_type & GF_REGION_NOSIMD)) return 0;
|
||||
if(h->region_type & GF_REGION_ALTMAP)
|
||||
{
|
||||
#ifdef INTEL_SSSE3
|
||||
gf->multiply_region.w64 = gf_w64_split_4_64_lazy_sse_altmap_multiply_region;
|
||||
#else
|
||||
return 0;
|
||||
if (gf_cpu_supports_intel_ssse3) {
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_split_4_64_lazy_sse_altmap_multiply_region)
|
||||
} else
|
||||
#elif defined(ARCH_AARCH64)
|
||||
if (gf_cpu_supports_arm_neon) {
|
||||
gf_w64_neon_split_init(gf);
|
||||
} else
|
||||
#endif
|
||||
return 0;
|
||||
}
|
||||
else //no altmap
|
||||
{
|
||||
#ifdef INTEL_SSE4
|
||||
if(h->region_type & GF_REGION_NOSSE)
|
||||
gf->multiply_region.w64 = gf_w64_split_4_64_lazy_multiply_region;
|
||||
else
|
||||
gf->multiply_region.w64 = gf_w64_split_4_64_lazy_sse_multiply_region;
|
||||
#else
|
||||
gf->multiply_region.w64 = gf_w64_split_4_64_lazy_multiply_region;
|
||||
if(h->region_type & GF_REGION_SSE)
|
||||
#if defined(INTEL_SSE4) || defined(ARCH_AARCH64)
|
||||
if(gf_cpu_supports_intel_sse4 || gf_cpu_supports_arm_neon) {
|
||||
if (h->region_type & GF_REGION_NOSIMD) {
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_split_4_64_lazy_multiply_region)
|
||||
} else
|
||||
#if defined(INTEL_SSE4)
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_split_4_64_lazy_sse_multiply_region)
|
||||
#elif defined(ARCH_AARCH64)
|
||||
gf_w64_neon_split_init(gf);
|
||||
#endif
|
||||
} else {
|
||||
#endif
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_split_4_64_lazy_multiply_region)
|
||||
if(h->region_type & GF_REGION_SIMD)
|
||||
return 0;
|
||||
#if defined(INTEL_SSE4) || defined(ARCH_AARCH64)
|
||||
}
|
||||
#endif
|
||||
}
|
||||
}
|
||||
if ((h->arg1 == 8 && h->arg2 == 64) || (h->arg1 == 64 && h->arg2 == 8)) {
|
||||
d8 = (struct gf_split_8_64_lazy_data *) h->private;
|
||||
d8->last_value = 0;
|
||||
gf->multiply_region.w64 = gf_w64_split_8_64_lazy_multiply_region;
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_split_8_64_lazy_multiply_region)
|
||||
}
|
||||
if ((h->arg1 == 16 && h->arg2 == 64) || (h->arg1 == 64 && h->arg2 == 16)) {
|
||||
d16 = (struct gf_split_16_64_lazy_data *) h->private;
|
||||
d16->last_value = 0;
|
||||
gf->multiply_region.w64 = gf_w64_split_16_64_lazy_multiply_region;
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_split_16_64_lazy_multiply_region)
|
||||
}
|
||||
if ((h->arg1 == 8 && h->arg2 == 8)) {
|
||||
d88 = (struct gf_split_8_8_data *) h->private;
|
||||
gf->multiply.w64 = gf_w64_split_8_8_multiply;
|
||||
SET_FUNCTION(gf,multiply,w64,gf_w64_split_8_8_multiply)
|
||||
|
||||
/* The performance of this guy sucks, so don't bother with a region op */
|
||||
|
||||
|
@ -2139,12 +2131,16 @@ int gf_w64_scratch_size(int mult_type, int region_type, int divide_type, int arg
|
|||
/* Allen: set the *local* arg1 and arg2, just for scratch size purposes,
|
||||
* then fall through to split table scratch size code. */
|
||||
|
||||
#ifdef INTEL_SSE4
|
||||
#if defined(INTEL_SSE4) || defined(ARCH_AARCH64)
|
||||
if (gf_cpu_supports_intel_sse4 || gf_cpu_supports_arm_neon) {
|
||||
arg1 = 64;
|
||||
arg2 = 4;
|
||||
#else
|
||||
} else {
|
||||
#endif
|
||||
arg1 = 64;
|
||||
arg2 = 8;
|
||||
#if defined(INTEL_SSE4) || defined(ARCH_AARCH64)
|
||||
}
|
||||
#endif
|
||||
|
||||
case GF_MULT_SPLIT_TABLE:
|
||||
|
@ -2179,7 +2175,6 @@ int gf_w64_scratch_size(int mult_type, int region_type, int divide_type, int arg
|
|||
int gf_w64_init(gf_t *gf)
|
||||
{
|
||||
gf_internal_t *h;
|
||||
int no_default_flag = 0;
|
||||
|
||||
h = (gf_internal_t *) gf->scratch;
|
||||
|
||||
|
@ -2194,16 +2189,12 @@ int gf_w64_init(gf_t *gf)
|
|||
} else {
|
||||
h->prim_poly = 0x1b;
|
||||
}
|
||||
if (no_default_flag == 1) {
|
||||
fprintf(stderr,"Code contains no default irreducible polynomial for given base field\n");
|
||||
return 0;
|
||||
}
|
||||
}
|
||||
|
||||
gf->multiply.w64 = NULL;
|
||||
gf->divide.w64 = NULL;
|
||||
gf->inverse.w64 = NULL;
|
||||
gf->multiply_region.w64 = NULL;
|
||||
SET_FUNCTION(gf,multiply,w64,NULL)
|
||||
SET_FUNCTION(gf,divide,w64,NULL)
|
||||
SET_FUNCTION(gf,inverse,w64,NULL)
|
||||
SET_FUNCTION(gf,multiply_region,w64,NULL)
|
||||
|
||||
switch(h->mult_type) {
|
||||
case GF_MULT_CARRY_FREE: if (gf_w64_cfm_init(gf) == 0) return 0; break;
|
||||
|
@ -2217,27 +2208,27 @@ int gf_w64_init(gf_t *gf)
|
|||
default: return 0;
|
||||
}
|
||||
if (h->divide_type == GF_DIVIDE_EUCLID) {
|
||||
gf->divide.w64 = gf_w64_divide_from_inverse;
|
||||
gf->inverse.w64 = gf_w64_euclid;
|
||||
SET_FUNCTION(gf,divide,w64,gf_w64_divide_from_inverse)
|
||||
SET_FUNCTION(gf,inverse,w64,gf_w64_euclid)
|
||||
}
|
||||
|
||||
if (gf->inverse.w64 != NULL && gf->divide.w64 == NULL) {
|
||||
gf->divide.w64 = gf_w64_divide_from_inverse;
|
||||
SET_FUNCTION(gf,divide,w64,gf_w64_divide_from_inverse)
|
||||
}
|
||||
if (gf->inverse.w64 == NULL && gf->divide.w64 != NULL) {
|
||||
gf->inverse.w64 = gf_w64_inverse_from_divide;
|
||||
SET_FUNCTION(gf,inverse,w64,gf_w64_inverse_from_divide)
|
||||
}
|
||||
|
||||
if (h->region_type == GF_REGION_CAUCHY) return 0;
|
||||
|
||||
if (h->region_type & GF_REGION_ALTMAP) {
|
||||
if (h->mult_type == GF_MULT_COMPOSITE) {
|
||||
gf->extract_word.w64 = gf_w64_composite_extract_word;
|
||||
SET_FUNCTION(gf,extract_word,w64,gf_w64_composite_extract_word)
|
||||
} else if (h->mult_type == GF_MULT_SPLIT_TABLE) {
|
||||
gf->extract_word.w64 = gf_w64_split_extract_word;
|
||||
SET_FUNCTION(gf,extract_word,w64,gf_w64_split_extract_word)
|
||||
}
|
||||
} else {
|
||||
gf->extract_word.w64 = gf_w64_extract_word;
|
||||
SET_FUNCTION(gf,extract_word,w64,gf_w64_extract_word)
|
||||
}
|
||||
|
||||
return 1;
|
||||
|
|
322
src/gf_w8.c
|
@ -9,87 +9,11 @@
|
|||
*/
|
||||
|
||||
#include "gf_int.h"
|
||||
#include "gf_w8.h"
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
|
||||
#define GF_FIELD_WIDTH (8)
|
||||
#define GF_FIELD_SIZE (1 << GF_FIELD_WIDTH)
|
||||
#define GF_HALF_SIZE (1 << (GF_FIELD_WIDTH/2))
|
||||
#define GF_MULT_GROUP_SIZE GF_FIELD_SIZE-1
|
||||
|
||||
#define GF_BASE_FIELD_WIDTH (4)
|
||||
#define GF_BASE_FIELD_SIZE (1 << GF_BASE_FIELD_WIDTH)
|
||||
|
||||
struct gf_w8_logtable_data {
|
||||
uint8_t log_tbl[GF_FIELD_SIZE];
|
||||
uint8_t antilog_tbl[GF_FIELD_SIZE * 2];
|
||||
uint8_t inv_tbl[GF_FIELD_SIZE];
|
||||
};
|
||||
|
||||
struct gf_w8_logzero_table_data {
|
||||
short log_tbl[GF_FIELD_SIZE]; /* Make this signed, so that we can divide easily */
|
||||
uint8_t antilog_tbl[512+512+1];
|
||||
uint8_t *div_tbl;
|
||||
uint8_t *inv_tbl;
|
||||
};
|
||||
|
||||
struct gf_w8_logzero_small_table_data {
|
||||
short log_tbl[GF_FIELD_SIZE]; /* Make this signed, so that we can divide easily */
|
||||
uint8_t antilog_tbl[255*3];
|
||||
uint8_t inv_tbl[GF_FIELD_SIZE];
|
||||
uint8_t *div_tbl;
|
||||
};
|
||||
|
||||
struct gf_w8_composite_data {
|
||||
uint8_t *mult_table;
|
||||
};
|
||||
|
||||
/* Don't change the order of these relative to gf_w8_half_table_data */
|
||||
|
||||
struct gf_w8_default_data {
|
||||
uint8_t high[GF_FIELD_SIZE][GF_HALF_SIZE];
|
||||
uint8_t low[GF_FIELD_SIZE][GF_HALF_SIZE];
|
||||
uint8_t divtable[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
uint8_t multtable[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
};
|
||||
|
||||
struct gf_w8_half_table_data {
|
||||
uint8_t high[GF_FIELD_SIZE][GF_HALF_SIZE];
|
||||
uint8_t low[GF_FIELD_SIZE][GF_HALF_SIZE];
|
||||
};
|
||||
|
||||
struct gf_w8_single_table_data {
|
||||
uint8_t divtable[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
uint8_t multtable[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
};
|
||||
|
||||
struct gf_w8_double_table_data {
|
||||
uint8_t div[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
uint16_t mult[GF_FIELD_SIZE][GF_FIELD_SIZE*GF_FIELD_SIZE];
|
||||
};
|
||||
|
||||
struct gf_w8_double_table_lazy_data {
|
||||
uint8_t div[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
uint8_t smult[GF_FIELD_SIZE][GF_FIELD_SIZE];
|
||||
uint16_t mult[GF_FIELD_SIZE*GF_FIELD_SIZE];
|
||||
};
|
||||
|
||||
struct gf_w4_logtable_data {
|
||||
uint8_t log_tbl[GF_BASE_FIELD_SIZE];
|
||||
uint8_t antilog_tbl[GF_BASE_FIELD_SIZE * 2];
|
||||
uint8_t *antilog_tbl_div;
|
||||
};
|
||||
|
||||
struct gf_w4_single_table_data {
|
||||
uint8_t div[GF_BASE_FIELD_SIZE][GF_BASE_FIELD_SIZE];
|
||||
uint8_t mult[GF_BASE_FIELD_SIZE][GF_BASE_FIELD_SIZE];
|
||||
};
|
||||
|
||||
struct gf_w8_bytwo_data {
|
||||
uint64_t prim_poly;
|
||||
uint64_t mask1;
|
||||
uint64_t mask2;
|
||||
};
|
||||
#include <assert.h>
|
||||
#include "gf_cpu.h"
|
||||
|
||||
#define AB2(ip, am1 ,am2, b, t1, t2) {\
|
||||
t1 = (b << 1) & am1;\
|
||||
|
@ -204,6 +128,7 @@ uint32_t gf_w8_matrix (gf_t *gf, uint32_t b)
|
|||
}
|
||||
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
static
|
||||
inline
|
||||
gf_val_32_t
|
||||
|
@ -211,8 +136,6 @@ gf_w8_clm_multiply_2 (gf_t *gf, gf_val_32_t a8, gf_val_32_t b8)
|
|||
{
|
||||
gf_val_32_t rv = 0;
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
|
||||
__m128i a, b;
|
||||
__m128i result;
|
||||
__m128i prim_poly;
|
||||
|
@ -246,10 +169,11 @@ gf_w8_clm_multiply_2 (gf_t *gf, gf_val_32_t a8, gf_val_32_t b8)
|
|||
|
||||
rv = ((gf_val_32_t)_mm_extract_epi32(result, 0));
|
||||
|
||||
#endif
|
||||
return rv;
|
||||
}
|
||||
#endif
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
static
|
||||
inline
|
||||
gf_val_32_t
|
||||
|
@ -257,8 +181,6 @@ gf_w8_clm_multiply_3 (gf_t *gf, gf_val_32_t a8, gf_val_32_t b8)
|
|||
{
|
||||
gf_val_32_t rv = 0;
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
|
||||
__m128i a, b;
|
||||
__m128i result;
|
||||
__m128i prim_poly;
|
||||
|
@ -285,10 +207,11 @@ gf_w8_clm_multiply_3 (gf_t *gf, gf_val_32_t a8, gf_val_32_t b8)
|
|||
|
||||
rv = ((gf_val_32_t)_mm_extract_epi32(result, 0));
|
||||
|
||||
#endif
|
||||
return rv;
|
||||
}
|
||||
#endif
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
static
|
||||
inline
|
||||
gf_val_32_t
|
||||
|
@ -296,8 +219,6 @@ gf_w8_clm_multiply_4 (gf_t *gf, gf_val_32_t a8, gf_val_32_t b8)
|
|||
{
|
||||
gf_val_32_t rv = 0;
|
||||
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
|
||||
__m128i a, b;
|
||||
__m128i result;
|
||||
__m128i prim_poly;
|
||||
|
@ -325,9 +246,9 @@ gf_w8_clm_multiply_4 (gf_t *gf, gf_val_32_t a8, gf_val_32_t b8)
|
|||
/* Extracts 32 bit value from result. */
|
||||
rv = ((gf_val_32_t)_mm_extract_epi32(result, 0));
|
||||
|
||||
#endif
|
||||
return rv;
|
||||
}
|
||||
#endif
|
||||
|
||||
|
||||
static
|
||||
|
@ -586,23 +507,29 @@ static
|
|||
int gf_w8_cfm_init(gf_t *gf)
|
||||
{
|
||||
#if defined(INTEL_SSE4_PCLMUL)
|
||||
gf_internal_t *h;
|
||||
if (gf_cpu_supports_intel_pclmul) {
|
||||
gf_internal_t *h;
|
||||
|
||||
h = (gf_internal_t *) gf->scratch;
|
||||
h = (gf_internal_t *) gf->scratch;
|
||||
|
||||
if ((0xe0 & h->prim_poly) == 0){
|
||||
gf->multiply.w32 = gf_w8_clm_multiply_2;
|
||||
gf->multiply_region.w32 = gf_w8_clm_multiply_region_from_single_2;
|
||||
}else if ((0xc0 & h->prim_poly) == 0){
|
||||
gf->multiply.w32 = gf_w8_clm_multiply_3;
|
||||
gf->multiply_region.w32 = gf_w8_clm_multiply_region_from_single_3;
|
||||
}else if ((0x80 & h->prim_poly) == 0){
|
||||
gf->multiply.w32 = gf_w8_clm_multiply_4;
|
||||
gf->multiply_region.w32 = gf_w8_clm_multiply_region_from_single_4;
|
||||
}else{
|
||||
return 0;
|
||||
}
|
||||
return 1;
|
||||
if ((0xe0 & h->prim_poly) == 0){
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w8_clm_multiply_2)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w8_clm_multiply_region_from_single_2)
|
||||
}else if ((0xc0 & h->prim_poly) == 0){
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w8_clm_multiply_3)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w8_clm_multiply_region_from_single_3)
|
||||
}else if ((0x80 & h->prim_poly) == 0){
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w8_clm_multiply_4)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w8_clm_multiply_region_from_single_4)
|
||||
}else{
|
||||
return 0;
|
||||
}
|
||||
return 1;
|
||||
}
|
||||
#elif defined(ARM_NEON)
|
||||
if (gf_cpu_supports_arm_neon) {
|
||||
return gf_w8_neon_cfm_init(gf);
|
||||
}
|
||||
#endif
|
||||
|
||||
return 0;
|
||||
|
@ -612,7 +539,7 @@ int gf_w8_cfm_init(gf_t *gf)
|
|||
static
|
||||
int gf_w8_shift_init(gf_t *gf)
|
||||
{
|
||||
gf->multiply.w32 = gf_w8_shift_multiply; /* The others will be set automatically */
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w8_shift_multiply) /* The others will be set automatically */
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -884,20 +811,20 @@ int gf_w8_log_init(gf_t *gf)
|
|||
} while (i != 1);
|
||||
|
||||
if (h->mult_type == GF_MULT_LOG_TABLE) {
|
||||
gf->inverse.w32 = gf_w8_log_inverse;
|
||||
gf->divide.w32 = gf_w8_log_divide;
|
||||
gf->multiply.w32 = gf_w8_log_multiply;
|
||||
gf->multiply_region.w32 = gf_w8_log_multiply_region;
|
||||
SET_FUNCTION(gf,inverse,w32,gf_w8_log_inverse)
|
||||
SET_FUNCTION(gf,divide,w32,gf_w8_log_divide)
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w8_log_multiply)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w8_log_multiply_region)
|
||||
} else if (h->mult_type == GF_MULT_LOG_ZERO) {
|
||||
gf->inverse.w32 = gf_w8_logzero_small_inverse;
|
||||
gf->divide.w32 = gf_w8_logzero_small_divide;
|
||||
gf->multiply.w32 = gf_w8_logzero_small_multiply;
|
||||
gf->multiply_region.w32 = gf_w8_logzero_multiply_region;
|
||||
SET_FUNCTION(gf,inverse,w32,gf_w8_logzero_small_inverse)
|
||||
SET_FUNCTION(gf,divide,w32,gf_w8_logzero_small_divide)
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w8_logzero_small_multiply)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w8_logzero_multiply_region)
|
||||
} else {
|
||||
gf->inverse.w32 = gf_w8_logzero_inverse;
|
||||
gf->divide.w32 = gf_w8_logzero_divide;
|
||||
gf->multiply.w32 = gf_w8_logzero_multiply;
|
||||
gf->multiply_region.w32 = gf_w8_logzero_multiply_region;
|
||||
SET_FUNCTION(gf,inverse,w32,gf_w8_logzero_inverse)
|
||||
SET_FUNCTION(gf,divide,w32,gf_w8_logzero_divide)
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w8_logzero_multiply)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w8_logzero_multiply_region)
|
||||
}
|
||||
return 1;
|
||||
}
|
||||
|
@ -938,7 +865,7 @@ gf_w8_default_multiply(gf_t *gf, gf_val_32_t a, gf_val_32_t b)
|
|||
return (ftd->multtable[a][b]);
|
||||
}
|
||||
|
||||
#ifdef INTEL_SSSE3
|
||||
#if defined(INTEL_SSSE3) || defined(ARM_NEON)
|
||||
static
|
||||
gf_val_32_t
|
||||
gf_w8_default_divide(gf_t *gf, gf_val_32_t a, gf_val_32_t b)
|
||||
|
@ -1177,17 +1104,22 @@ int gf_w8_split_init(gf_t *gf)
|
|||
}
|
||||
}
|
||||
|
||||
gf->multiply.w32 = gf_w8_split_multiply;
|
||||
|
||||
#ifdef INTEL_SSSE3
|
||||
if (h->region_type & GF_REGION_NOSSE)
|
||||
gf->multiply_region.w32 = gf_w8_split_multiply_region;
|
||||
else
|
||||
gf->multiply_region.w32 = gf_w8_split_multiply_region_sse;
|
||||
#else
|
||||
gf->multiply_region.w32 = gf_w8_split_multiply_region;
|
||||
if(h->region_type & GF_REGION_SSE)
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w8_split_multiply)
|
||||
|
||||
#if defined(INTEL_SSSE3)
|
||||
if (gf_cpu_supports_intel_ssse3 && !(h->region_type & GF_REGION_NOSIMD)) {
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w8_split_multiply_region_sse)
|
||||
} else {
|
||||
#elif defined(ARM_NEON)
|
||||
if (gf_cpu_supports_arm_neon && !(h->region_type & GF_REGION_NOSIMD)) {
|
||||
gf_w8_neon_split_init(gf);
|
||||
} else {
|
||||
#endif
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w8_split_multiply_region)
|
||||
if(h->region_type & GF_REGION_SIMD)
|
||||
return 0;
|
||||
#if defined(INTEL_SSSE3) || defined(ARM_NEON)
|
||||
}
|
||||
#endif
|
||||
|
||||
return 1;
|
||||
|
@ -1205,16 +1137,12 @@ int gf_w8_table_init(gf_t *gf)
|
|||
struct gf_w8_double_table_data *dtd = NULL;
|
||||
struct gf_w8_double_table_lazy_data *ltd = NULL;
|
||||
struct gf_w8_default_data *dd = NULL;
|
||||
int a, b, c, prod, scase, issse;
|
||||
int a, b, c, prod, scase;
|
||||
|
||||
h = (gf_internal_t *) gf->scratch;
|
||||
|
||||
issse = 0;
|
||||
#ifdef INTEL_SSSE3
|
||||
issse = 1;
|
||||
#endif
|
||||
|
||||
if (h->mult_type == GF_MULT_DEFAULT && issse) {
|
||||
if (h->mult_type == GF_MULT_DEFAULT &&
|
||||
(gf_cpu_supports_intel_ssse3 || gf_cpu_supports_arm_neon)) {
|
||||
dd = (struct gf_w8_default_data *)h->private;
|
||||
scase = 3;
|
||||
bzero(dd->high, sizeof(uint8_t) * GF_FIELD_SIZE * GF_HALF_SIZE);
|
||||
|
@ -1239,7 +1167,7 @@ int gf_w8_table_init(gf_t *gf)
|
|||
scase = 2;
|
||||
} else {
|
||||
fprintf(stderr, "Internal error in gf_w8_table_init\n");
|
||||
exit(0);
|
||||
assert(0);
|
||||
}
|
||||
|
||||
for (a = 1; a < GF_FIELD_SIZE; a++) {
|
||||
|
@ -1271,28 +1199,38 @@ int gf_w8_table_init(gf_t *gf)
|
|||
}
|
||||
}
|
||||
|
||||
gf->inverse.w32 = NULL; /* Will set from divide */
|
||||
SET_FUNCTION(gf,inverse,w32,NULL) /* Will set from divide */
|
||||
switch (scase) {
|
||||
case 0:
|
||||
gf->divide.w32 = gf_w8_table_divide;
|
||||
gf->multiply.w32 = gf_w8_table_multiply;
|
||||
gf->multiply_region.w32 = gf_w8_table_multiply_region;
|
||||
SET_FUNCTION(gf,divide,w32,gf_w8_table_divide)
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w8_table_multiply)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w8_table_multiply_region)
|
||||
break;
|
||||
case 1:
|
||||
gf->divide.w32 = gf_w8_double_table_divide;
|
||||
gf->multiply.w32 = gf_w8_double_table_multiply;
|
||||
gf->multiply_region.w32 = gf_w8_double_table_multiply_region;
|
||||
SET_FUNCTION(gf,divide,w32,gf_w8_double_table_divide)
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w8_double_table_multiply)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w8_double_table_multiply_region)
|
||||
break;
|
||||
case 2:
|
||||
gf->divide.w32 = gf_w8_double_table_lazy_divide;
|
||||
gf->multiply.w32 = gf_w8_double_table_lazy_multiply;
|
||||
gf->multiply_region.w32 = gf_w8_double_table_multiply_region;
|
||||
SET_FUNCTION(gf,divide,w32,gf_w8_double_table_lazy_divide)
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w8_double_table_lazy_multiply)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w8_double_table_multiply_region)
|
||||
break;
|
||||
case 3:
|
||||
#ifdef INTEL_SSSE3
|
||||
gf->divide.w32 = gf_w8_default_divide;
|
||||
gf->multiply.w32 = gf_w8_default_multiply;
|
||||
gf->multiply_region.w32 = gf_w8_split_multiply_region_sse;
|
||||
#if defined(INTEL_SSSE3) || defined(ARM_NEON)
|
||||
if (gf_cpu_supports_intel_ssse3 || gf_cpu_supports_arm_neon) {
|
||||
SET_FUNCTION(gf,divide,w32,gf_w8_default_divide)
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w8_default_multiply)
|
||||
#if defined(INTEL_SSSE3)
|
||||
if (gf_cpu_supports_intel_ssse3) {
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w8_split_multiply_region_sse)
|
||||
}
|
||||
#elif defined(ARM_NEON)
|
||||
if (gf_cpu_supports_arm_neon) {
|
||||
gf_w8_neon_split_init(gf);
|
||||
}
|
||||
#endif
|
||||
}
|
||||
#endif
|
||||
break;
|
||||
}
|
||||
|
@ -1538,18 +1476,18 @@ int gf_w8_composite_init(gf_t *gf)
|
|||
cd->mult_table = gf_w4_get_mult_table(h->base_gf);
|
||||
|
||||
if (h->region_type & GF_REGION_ALTMAP) {
|
||||
gf->multiply_region.w32 = gf_w8_composite_multiply_region_alt;
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w8_composite_multiply_region_alt)
|
||||
} else {
|
||||
gf->multiply_region.w32 = gf_w8_composite_multiply_region;
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w8_composite_multiply_region)
|
||||
}
|
||||
|
||||
if (cd->mult_table == NULL) {
|
||||
gf->multiply.w32 = gf_w8_composite_multiply_recursive;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w8_composite_multiply_recursive)
|
||||
} else {
|
||||
gf->multiply.w32 = gf_w8_composite_multiply_inline;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w8_composite_multiply_inline)
|
||||
}
|
||||
gf->divide.w32 = NULL;
|
||||
gf->inverse.w32 = gf_w8_composite_inverse;
|
||||
SET_FUNCTION(gf,divide,w32,NULL)
|
||||
SET_FUNCTION(gf,inverse,w32,gf_w8_composite_inverse)
|
||||
|
||||
return 1;
|
||||
}
|
||||
|
@ -2256,28 +2194,30 @@ int gf_w8_bytwo_init(gf_t *gf)
|
|||
}
|
||||
|
||||
if (h->mult_type == GF_MULT_BYTWO_p) {
|
||||
gf->multiply.w32 = gf_w8_bytwo_p_multiply;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w8_bytwo_p_multiply)
|
||||
#ifdef INTEL_SSE2
|
||||
if (h->region_type & GF_REGION_NOSSE)
|
||||
gf->multiply_region.w32 = gf_w8_bytwo_p_nosse_multiply_region;
|
||||
else
|
||||
gf->multiply_region.w32 = gf_w8_bytwo_p_sse_multiply_region;
|
||||
#else
|
||||
gf->multiply_region.w32 = gf_w8_bytwo_p_nosse_multiply_region;
|
||||
if(h->region_type & GF_REGION_SSE)
|
||||
return 0;
|
||||
if (gf_cpu_supports_intel_sse2 && !(h->region_type & GF_REGION_NOSIMD)) {
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w8_bytwo_p_sse_multiply_region)
|
||||
} else {
|
||||
#endif
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w8_bytwo_p_nosse_multiply_region)
|
||||
if(h->region_type & GF_REGION_SIMD)
|
||||
return 0;
|
||||
#ifdef INTEL_SSE2
|
||||
}
|
||||
#endif
|
||||
} else {
|
||||
gf->multiply.w32 = gf_w8_bytwo_b_multiply;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w8_bytwo_b_multiply)
|
||||
#ifdef INTEL_SSE2
|
||||
if (h->region_type & GF_REGION_NOSSE)
|
||||
gf->multiply_region.w32 = gf_w8_bytwo_b_nosse_multiply_region;
|
||||
else
|
||||
gf->multiply_region.w32 = gf_w8_bytwo_b_sse_multiply_region;
|
||||
#else
|
||||
gf->multiply_region.w32 = gf_w8_bytwo_b_nosse_multiply_region;
|
||||
if(h->region_type & GF_REGION_SSE)
|
||||
if (gf_cpu_supports_intel_sse2 && !(h->region_type & GF_REGION_NOSIMD)) {
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w8_bytwo_b_sse_multiply_region)
|
||||
} else {
|
||||
#endif
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w8_bytwo_b_nosse_multiply_region)
|
||||
if(h->region_type & GF_REGION_SIMD)
|
||||
return 0;
|
||||
#ifdef INTEL_SSE2
|
||||
}
|
||||
#endif
|
||||
}
|
||||
return 1;
|
||||
|
@ -2295,9 +2235,9 @@ int gf_w8_scratch_size(int mult_type, int region_type, int divide_type, int arg1
|
|||
switch(mult_type)
|
||||
{
|
||||
case GF_MULT_DEFAULT:
|
||||
#ifdef INTEL_SSSE3
|
||||
return sizeof(gf_internal_t) + sizeof(struct gf_w8_default_data) + 64;
|
||||
#endif
|
||||
if (gf_cpu_supports_intel_ssse3 || gf_cpu_supports_arm_neon) {
|
||||
return sizeof(gf_internal_t) + sizeof(struct gf_w8_default_data) + 64;
|
||||
}
|
||||
return sizeof(gf_internal_t) + sizeof(struct gf_w8_single_table_data) + 64;
|
||||
case GF_MULT_TABLE:
|
||||
if (region_type == GF_REGION_CAUCHY) {
|
||||
|
@ -2370,11 +2310,11 @@ int gf_w8_init(gf_t *gf)
|
|||
h->prim_poly |= 0x100;
|
||||
}
|
||||
|
||||
gf->multiply.w32 = NULL;
|
||||
gf->divide.w32 = NULL;
|
||||
gf->inverse.w32 = NULL;
|
||||
gf->multiply_region.w32 = NULL;
|
||||
gf->extract_word.w32 = gf_w8_extract_word;
|
||||
SET_FUNCTION(gf,multiply,w32,NULL)
|
||||
SET_FUNCTION(gf,divide,w32,NULL)
|
||||
SET_FUNCTION(gf,inverse,w32,NULL)
|
||||
SET_FUNCTION(gf,multiply_region,w32,NULL)
|
||||
SET_FUNCTION(gf,extract_word,w32,gf_w8_extract_word)
|
||||
|
||||
switch(h->mult_type) {
|
||||
case GF_MULT_DEFAULT:
|
||||
|
@ -2392,31 +2332,31 @@ int gf_w8_init(gf_t *gf)
|
|||
}
|
||||
|
||||
if (h->divide_type == GF_DIVIDE_EUCLID) {
|
||||
gf->divide.w32 = gf_w8_divide_from_inverse;
|
||||
gf->inverse.w32 = gf_w8_euclid;
|
||||
SET_FUNCTION(gf,divide,w32,gf_w8_divide_from_inverse)
|
||||
SET_FUNCTION(gf,inverse,w32,gf_w8_euclid)
|
||||
} else if (h->divide_type == GF_DIVIDE_MATRIX) {
|
||||
gf->divide.w32 = gf_w8_divide_from_inverse;
|
||||
gf->inverse.w32 = gf_w8_matrix;
|
||||
SET_FUNCTION(gf,divide,w32,gf_w8_divide_from_inverse)
|
||||
SET_FUNCTION(gf,inverse,w32,gf_w8_matrix)
|
||||
}
|
||||
|
||||
if (gf->divide.w32 == NULL) {
|
||||
gf->divide.w32 = gf_w8_divide_from_inverse;
|
||||
if (gf->inverse.w32 == NULL) gf->inverse.w32 = gf_w8_euclid;
|
||||
SET_FUNCTION(gf,divide,w32,gf_w8_divide_from_inverse)
|
||||
if (gf->inverse.w32 == NULL) SET_FUNCTION(gf,inverse,w32,gf_w8_euclid)
|
||||
}
|
||||
|
||||
if (gf->inverse.w32 == NULL) gf->inverse.w32 = gf_w8_inverse_from_divide;
|
||||
if (gf->inverse.w32 == NULL) SET_FUNCTION(gf,inverse,w32,gf_w8_inverse_from_divide)
|
||||
|
||||
if (h->mult_type == GF_MULT_COMPOSITE && (h->region_type & GF_REGION_ALTMAP)) {
|
||||
gf->extract_word.w32 = gf_w8_composite_extract_word;
|
||||
SET_FUNCTION(gf,extract_word,w32,gf_w8_composite_extract_word)
|
||||
}
|
||||
|
||||
if (h->region_type == GF_REGION_CAUCHY) {
|
||||
gf->multiply_region.w32 = gf_wgen_cauchy_region;
|
||||
gf->extract_word.w32 = gf_wgen_extract_word;
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_wgen_cauchy_region)
|
||||
SET_FUNCTION(gf,extract_word,w32,gf_wgen_extract_word)
|
||||
}
|
||||
|
||||
if (gf->multiply_region.w32 == NULL) {
|
||||
gf->multiply_region.w32 = gf_w8_multiply_region_from_single;
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w8_multiply_region_from_single)
|
||||
}
|
||||
|
||||
return 1;
|
||||
|
|
100
src/gf_wgen.c
|
@ -166,10 +166,10 @@ gf_wgen_shift_multiply (gf_t *gf, uint32_t a32, uint32_t b32)
|
|||
|
||||
product = 0;
|
||||
|
||||
for (i = 0; i < h->w; i++) {
|
||||
for (i = 0; i < (uint64_t)h->w; i++) {
|
||||
if (a & (one << i)) product ^= (b << i);
|
||||
}
|
||||
for (i = h->w*2-1; i >= h->w; i--) {
|
||||
for (i = h->w*2-1; i >= (uint64_t)h->w; i--) {
|
||||
if (product & (one << i)) product ^= (pp << (i-h->w));
|
||||
}
|
||||
return product;
|
||||
|
@ -178,8 +178,8 @@ gf_wgen_shift_multiply (gf_t *gf, uint32_t a32, uint32_t b32)
|
|||
static
|
||||
int gf_wgen_shift_init(gf_t *gf)
|
||||
{
|
||||
gf->multiply.w32 = gf_wgen_shift_multiply;
|
||||
gf->inverse.w32 = gf_wgen_euclid;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_wgen_shift_multiply)
|
||||
SET_FUNCTION(gf,inverse,w32,gf_wgen_euclid)
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -211,8 +211,8 @@ gf_wgen_bytwo_b_multiply (gf_t *gf, gf_val_32_t a, gf_val_32_t b)
|
|||
static
|
||||
int gf_wgen_bytwo_b_init(gf_t *gf)
|
||||
{
|
||||
gf->multiply.w32 = gf_wgen_bytwo_b_multiply;
|
||||
gf->inverse.w32 = gf_wgen_euclid;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_wgen_bytwo_b_multiply)
|
||||
SET_FUNCTION(gf,inverse,w32,gf_wgen_euclid)
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -247,8 +247,8 @@ gf_wgen_bytwo_p_multiply (gf_t *gf, gf_val_32_t a, gf_val_32_t b)
|
|||
static
|
||||
int gf_wgen_bytwo_p_init(gf_t *gf)
|
||||
{
|
||||
gf->multiply.w32 = gf_wgen_bytwo_p_multiply;
|
||||
gf->inverse.w32 = gf_wgen_euclid;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_wgen_bytwo_p_multiply)
|
||||
SET_FUNCTION(gf,inverse,w32,gf_wgen_euclid)
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -256,7 +256,7 @@ static
|
|||
void
|
||||
gf_wgen_group_set_shift_tables(uint32_t *shift, uint32_t val, gf_internal_t *h)
|
||||
{
|
||||
int i;
|
||||
uint32_t i;
|
||||
uint32_t j;
|
||||
int g_s;
|
||||
|
||||
|
@ -268,7 +268,7 @@ gf_wgen_group_set_shift_tables(uint32_t *shift, uint32_t val, gf_internal_t *h)
|
|||
|
||||
shift[0] = 0;
|
||||
|
||||
for (i = 1; i < (1 << g_s); i <<= 1) {
|
||||
for (i = 1; i < ((uint32_t)1 << g_s); i <<= 1) {
|
||||
for (j = 0; j < i; j++) shift[i|j] = shift[j]^val;
|
||||
if (val & (1 << (h->w-1))) {
|
||||
val <<= 1;
|
||||
|
@ -417,7 +417,7 @@ int gf_wgen_group_init(gf_t *gf)
|
|||
uint32_t i, j, p, index;
|
||||
struct gf_wgen_group_data *gd;
|
||||
gf_internal_t *h = (gf_internal_t *) gf->scratch;
|
||||
int g_s, g_r;
|
||||
uint32_t g_s, g_r;
|
||||
|
||||
if (h->mult_type == GF_MULT_DEFAULT) {
|
||||
g_s = 2;
|
||||
|
@ -440,7 +440,7 @@ int gf_wgen_group_init(gf_t *gf)
|
|||
gd->tshift = ((gd->tshift-1)/g_r) * g_r;
|
||||
|
||||
gd->reduce[0] = 0;
|
||||
for (i = 0; i < (1 << g_r); i++) {
|
||||
for (i = 0; i < ((uint32_t)1 << g_r); i++) {
|
||||
p = 0;
|
||||
index = 0;
|
||||
for (j = 0; j < g_r; j++) {
|
||||
|
@ -453,12 +453,12 @@ int gf_wgen_group_init(gf_t *gf)
|
|||
}
|
||||
|
||||
if (g_s == g_r) {
|
||||
gf->multiply.w32 = gf_wgen_group_s_equals_r_multiply;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_wgen_group_s_equals_r_multiply)
|
||||
} else {
|
||||
gf->multiply.w32 = gf_wgen_group_multiply;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_wgen_group_multiply)
|
||||
}
|
||||
gf->divide.w32 = NULL;
|
||||
gf->divide.w32 = NULL;
|
||||
SET_FUNCTION(gf,divide,w32,NULL)
|
||||
SET_FUNCTION(gf,divide,w32,NULL)
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -504,23 +504,23 @@ int gf_wgen_table_8_init(gf_t *gf)
|
|||
std->mult = &(std->base);
|
||||
std->div = std->mult + ((1<<h->w)*(1<<h->w));
|
||||
|
||||
for (a = 0; a < (1 << w); a++) {
|
||||
for (a = 0; a < ((uint32_t)1 << w); a++) {
|
||||
std->mult[a] = 0;
|
||||
std->mult[a<<w] = 0;
|
||||
std->div[a] = 0;
|
||||
std->div[a<<w] = 0;
|
||||
}
|
||||
|
||||
for (a = 1; a < (1 << w); a++) {
|
||||
for (b = 1; b < (1 << w); b++) {
|
||||
for (a = 1; a < ((uint32_t)1 << w); a++) {
|
||||
for (b = 1; b < ((uint32_t)1 << w); b++) {
|
||||
p = gf_wgen_shift_multiply(gf, a, b);
|
||||
std->mult[(a<<w)|b] = p;
|
||||
std->div[(p<<w)|a] = b;
|
||||
}
|
||||
}
|
||||
|
||||
gf->multiply.w32 = gf_wgen_table_8_multiply;
|
||||
gf->divide.w32 = gf_wgen_table_8_divide;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_wgen_table_8_multiply)
|
||||
SET_FUNCTION(gf,divide,w32,gf_wgen_table_8_divide)
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -565,23 +565,23 @@ int gf_wgen_table_16_init(gf_t *gf)
|
|||
std->mult = &(std->base);
|
||||
std->div = std->mult + ((1<<h->w)*(1<<h->w));
|
||||
|
||||
for (a = 0; a < (1 << w); a++) {
|
||||
for (a = 0; a < ((uint32_t)1 << w); a++) {
|
||||
std->mult[a] = 0;
|
||||
std->mult[a<<w] = 0;
|
||||
std->div[a] = 0;
|
||||
std->div[a<<w] = 0;
|
||||
}
|
||||
|
||||
for (a = 1; a < (1 << w); a++) {
|
||||
for (b = 1; b < (1 << w); b++) {
|
||||
for (a = 1; a < ((uint32_t)1 << w); a++) {
|
||||
for (b = 1; b < ((uint32_t)1 << w); b++) {
|
||||
p = gf_wgen_shift_multiply(gf, a, b);
|
||||
std->mult[(a<<w)|b] = p;
|
||||
std->div[(p<<w)|a] = b;
|
||||
}
|
||||
}
|
||||
|
||||
gf->multiply.w32 = gf_wgen_table_16_multiply;
|
||||
gf->divide.w32 = gf_wgen_table_16_divide;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_wgen_table_16_multiply)
|
||||
SET_FUNCTION(gf,divide,w32,gf_wgen_table_16_divide)
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -649,11 +649,11 @@ int gf_wgen_log_8_init(gf_t *gf)
|
|||
std->anti = std->log + (1<<h->w);
|
||||
std->danti = std->anti + (1<<h->w)-1;
|
||||
|
||||
for (i = 0; i < (1 << w); i++)
|
||||
for (i = 0; i < ((uint32_t)1 << w); i++)
|
||||
std->log[i] = 0;
|
||||
|
||||
a = 1;
|
||||
for(i=0; i < (1<<w)-1; i++)
|
||||
for(i=0; i < ((uint32_t)1<<w)-1; i++)
|
||||
{
|
||||
if (std->log[a] != 0) check = 1;
|
||||
std->log[a] = i;
|
||||
|
@ -670,8 +670,8 @@ int gf_wgen_log_8_init(gf_t *gf)
|
|||
return 0;
|
||||
}
|
||||
|
||||
gf->multiply.w32 = gf_wgen_log_8_multiply;
|
||||
gf->divide.w32 = gf_wgen_log_8_divide;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_wgen_log_8_multiply)
|
||||
SET_FUNCTION(gf,divide,w32,gf_wgen_log_8_divide)
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -724,11 +724,11 @@ int gf_wgen_log_16_init(gf_t *gf)
|
|||
std->anti = std->log + (1<<h->w);
|
||||
std->danti = std->anti + (1<<h->w)-1;
|
||||
|
||||
for (i = 0; i < (1 << w); i++)
|
||||
for (i = 0; i < ((uint32_t)1 << w); i++)
|
||||
std->log[i] = 0;
|
||||
|
||||
a = 1;
|
||||
for(i=0; i < (1<<w)-1; i++)
|
||||
for(i=0; i < ((uint32_t)1<<w)-1; i++)
|
||||
{
|
||||
if (std->log[a] != 0) check = 1;
|
||||
std->log[a] = i;
|
||||
|
@ -746,8 +746,8 @@ int gf_wgen_log_16_init(gf_t *gf)
|
|||
return 0;
|
||||
}
|
||||
|
||||
gf->multiply.w32 = gf_wgen_log_16_multiply;
|
||||
gf->divide.w32 = gf_wgen_log_16_divide;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_wgen_log_16_multiply)
|
||||
SET_FUNCTION(gf,divide,w32,gf_wgen_log_16_divide)
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -800,11 +800,11 @@ int gf_wgen_log_32_init(gf_t *gf)
|
|||
std->anti = std->log + (1<<h->w);
|
||||
std->danti = std->anti + (1<<h->w)-1;
|
||||
|
||||
for (i = 0; i < (1 << w); i++)
|
||||
for (i = 0; i < ((uint32_t)1 << w); i++)
|
||||
std->log[i] = 0;
|
||||
|
||||
a = 1;
|
||||
for(i=0; i < (1<<w)-1; i++)
|
||||
for(i=0; i < ((uint32_t)1<<w)-1; i++)
|
||||
{
|
||||
if (std->log[a] != 0) check = 1;
|
||||
std->log[a] = i;
|
||||
|
@ -821,8 +821,8 @@ int gf_wgen_log_32_init(gf_t *gf)
|
|||
return 0;
|
||||
}
|
||||
|
||||
gf->multiply.w32 = gf_wgen_log_32_multiply;
|
||||
gf->divide.w32 = gf_wgen_log_32_divide;
|
||||
SET_FUNCTION(gf,multiply,w32,gf_wgen_log_32_multiply)
|
||||
SET_FUNCTION(gf,divide,w32,gf_wgen_log_32_divide)
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
@ -975,11 +975,11 @@ int gf_wgen_init(gf_t *gf)
|
|||
}
|
||||
}
|
||||
|
||||
gf->multiply.w32 = NULL;
|
||||
gf->divide.w32 = NULL;
|
||||
gf->inverse.w32 = NULL;
|
||||
gf->multiply_region.w32 = gf_wgen_cauchy_region;
|
||||
gf->extract_word.w32 = gf_wgen_extract_word;
|
||||
SET_FUNCTION(gf,multiply,w32,NULL)
|
||||
SET_FUNCTION(gf,divide,w32,NULL)
|
||||
SET_FUNCTION(gf,inverse,w32,NULL)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_wgen_cauchy_region)
|
||||
SET_FUNCTION(gf,extract_word,w32,gf_wgen_extract_word)
|
||||
|
||||
switch(h->mult_type) {
|
||||
case GF_MULT_DEFAULT:
|
||||
|
@ -1000,20 +1000,20 @@ int gf_wgen_init(gf_t *gf)
|
|||
default: return 0;
|
||||
}
|
||||
if (h->divide_type == GF_DIVIDE_EUCLID) {
|
||||
gf->divide.w32 = gf_wgen_divide_from_inverse;
|
||||
gf->inverse.w32 = gf_wgen_euclid;
|
||||
SET_FUNCTION(gf,divide,w32,gf_wgen_divide_from_inverse)
|
||||
SET_FUNCTION(gf,inverse,w32,gf_wgen_euclid)
|
||||
} else if (h->divide_type == GF_DIVIDE_MATRIX) {
|
||||
gf->divide.w32 = gf_wgen_divide_from_inverse;
|
||||
gf->inverse.w32 = gf_wgen_matrix;
|
||||
SET_FUNCTION(gf,divide,w32,gf_wgen_divide_from_inverse)
|
||||
SET_FUNCTION(gf,inverse,w32,gf_wgen_matrix)
|
||||
}
|
||||
|
||||
if (gf->inverse.w32== NULL && gf->divide.w32 == NULL) gf->inverse.w32 = gf_wgen_euclid;
|
||||
if (gf->inverse.w32== NULL && gf->divide.w32 == NULL) SET_FUNCTION(gf,inverse,w32,gf_wgen_euclid)
|
||||
|
||||
if (gf->inverse.w32 != NULL && gf->divide.w32 == NULL) {
|
||||
gf->divide.w32 = gf_wgen_divide_from_inverse;
|
||||
SET_FUNCTION(gf,divide,w32,gf_wgen_divide_from_inverse)
|
||||
}
|
||||
if (gf->inverse.w32 == NULL && gf->divide.w32 != NULL) {
|
||||
gf->inverse.w32 = gf_wgen_inverse_from_divide;
|
||||
SET_FUNCTION(gf,inverse,w32,gf_wgen_inverse_from_divide)
|
||||
}
|
||||
return 1;
|
||||
}
|
||||
|
|
|
@ -0,0 +1,276 @@
|
|||
/*
|
||||
* GF-Complete: A Comprehensive Open Source Library for Galois Field Arithmetic
|
||||
* James S. Plank, Ethan L. Miller, Kevin M. Greenan,
|
||||
* Benjamin A. Arnold, John A. Burnum, Adam W. Disney, Allen C. McBride.
|
||||
*
|
||||
* Copyright (c) 2014: Janne Grunau <j@jannau.net>
|
||||
*
|
||||
* Redistribution and use in source and binary forms, with or without
|
||||
* modification, are permitted provided that the following conditions
|
||||
* are met:
|
||||
*
|
||||
* - Redistributions of source code must retain the above copyright
|
||||
* notice, this list of conditions and the following disclaimer.
|
||||
*
|
||||
* - Redistributions in binary form must reproduce the above copyright
|
||||
* notice, this list of conditions and the following disclaimer in
|
||||
* the documentation and/or other materials provided with the
|
||||
* distribution.
|
||||
*
|
||||
* - Neither the name of the University of Tennessee nor the names of its
|
||||
* contributors may be used to endorse or promote products derived
|
||||
* from this software without specific prior written permission.
|
||||
*
|
||||
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
||||
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
||||
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
||||
* A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
|
||||
* HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
|
||||
* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
|
||||
* BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS
|
||||
* OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
|
||||
* AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
|
||||
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY
|
||||
* WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
||||
* POSSIBILITY OF SUCH DAMAGE.
|
||||
*
|
||||
*
|
||||
* gf_w16_neon.c
|
||||
*
|
||||
* Neon routines for 16-bit Galois fields
|
||||
*
|
||||
*/
|
||||
|
||||
#include "gf_int.h"
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
#include "gf_w16.h"
|
||||
|
||||
#ifndef ARCH_AARCH64
|
||||
#define vqtbl1q_u8(tbl, v) vcombine_u8(vtbl2_u8(tbl, vget_low_u8(v)), \
|
||||
vtbl2_u8(tbl, vget_high_u8(v)))
|
||||
#endif
|
||||
|
||||
static
|
||||
inline
|
||||
void
|
||||
neon_w16_split_4_multiply_region(gf_t *gf, uint16_t *src, uint16_t *dst,
|
||||
uint16_t *d_end, uint8_t *tbl,
|
||||
gf_val_32_t val, int xor)
|
||||
{
|
||||
unsigned i;
|
||||
uint8_t *high = tbl + 4 * 16;
|
||||
uint8x16_t loset, rl, rh;
|
||||
uint8x16x2_t va;
|
||||
|
||||
#ifdef ARCH_AARCH64
|
||||
uint8x16_t tbl_h[4], tbl_l[4];
|
||||
for (i = 0; i < 4; i++) {
|
||||
tbl_l[i] = vld1q_u8(tbl + i*16);
|
||||
tbl_h[i] = vld1q_u8(high + i*16);
|
||||
}
|
||||
#else
|
||||
uint8x8x2_t tbl_h[4], tbl_l[4];
|
||||
for (i = 0; i < 4; i++) {
|
||||
tbl_l[i].val[0] = vld1_u8(tbl + i*16);
|
||||
tbl_l[i].val[1] = vld1_u8(tbl + i*16 + 8);
|
||||
tbl_h[i].val[0] = vld1_u8(high + i*16);
|
||||
tbl_h[i].val[1] = vld1_u8(high + i*16 + 8);
|
||||
}
|
||||
#endif
|
||||
|
||||
loset = vdupq_n_u8(0xf);
|
||||
|
||||
if (xor) {
|
||||
uint8x16x2_t vb;
|
||||
while (dst < d_end) {
|
||||
va = vld2q_u8((uint8_t*)src);
|
||||
vb = vld2q_u8((uint8_t*)dst);
|
||||
|
||||
rl = vqtbl1q_u8(tbl_l[0], vandq_u8(va.val[0], loset));
|
||||
rh = vqtbl1q_u8(tbl_h[0], vandq_u8(va.val[0], loset));
|
||||
rl = veorq_u8(rl, vqtbl1q_u8(tbl_l[2], vandq_u8(va.val[1], loset)));
|
||||
rh = veorq_u8(rh, vqtbl1q_u8(tbl_h[2], vandq_u8(va.val[1], loset)));
|
||||
|
||||
va.val[0] = vshrq_n_u8(va.val[0], 4);
|
||||
va.val[1] = vshrq_n_u8(va.val[1], 4);
|
||||
|
||||
rl = veorq_u8(rl, vqtbl1q_u8(tbl_l[1], va.val[0]));
|
||||
rh = veorq_u8(rh, vqtbl1q_u8(tbl_h[1], va.val[0]));
|
||||
va.val[0] = veorq_u8(rl, vqtbl1q_u8(tbl_l[3], va.val[1]));
|
||||
va.val[1] = veorq_u8(rh, vqtbl1q_u8(tbl_h[3], va.val[1]));
|
||||
|
||||
va.val[0] = veorq_u8(va.val[0], vb.val[0]);
|
||||
va.val[1] = veorq_u8(va.val[1], vb.val[1]);
|
||||
vst2q_u8((uint8_t*)dst, va);
|
||||
|
||||
src += 16;
|
||||
dst += 16;
|
||||
}
|
||||
} else {
|
||||
while (dst < d_end) {
|
||||
va = vld2q_u8((uint8_t*)src);
|
||||
|
||||
rl = vqtbl1q_u8(tbl_l[0], vandq_u8(va.val[0], loset));
|
||||
rh = vqtbl1q_u8(tbl_h[0], vandq_u8(va.val[0], loset));
|
||||
rl = veorq_u8(rl, vqtbl1q_u8(tbl_l[2], vandq_u8(va.val[1], loset)));
|
||||
rh = veorq_u8(rh, vqtbl1q_u8(tbl_h[2], vandq_u8(va.val[1], loset)));
|
||||
|
||||
va.val[0] = vshrq_n_u8(va.val[0], 4);
|
||||
va.val[1] = vshrq_n_u8(va.val[1], 4);
|
||||
|
||||
rl = veorq_u8(rl, vqtbl1q_u8(tbl_l[1], va.val[0]));
|
||||
rh = veorq_u8(rh, vqtbl1q_u8(tbl_h[1], va.val[0]));
|
||||
va.val[0] = veorq_u8(rl, vqtbl1q_u8(tbl_l[3], va.val[1]));
|
||||
va.val[1] = veorq_u8(rh, vqtbl1q_u8(tbl_h[3], va.val[1]));
|
||||
|
||||
vst2q_u8((uint8_t*)dst, va);
|
||||
|
||||
src += 16;
|
||||
dst += 16;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
static
|
||||
inline
|
||||
void
|
||||
neon_w16_split_4_altmap_multiply_region(gf_t *gf, uint8_t *src,
|
||||
uint8_t *dst, uint8_t *d_end,
|
||||
uint8_t *tbl, gf_val_32_t val,
|
||||
int xor)
|
||||
{
|
||||
unsigned i;
|
||||
uint8_t *high = tbl + 4 * 16;
|
||||
uint8x16_t vh, vl, rh, rl;
|
||||
uint8x16_t loset;
|
||||
|
||||
#ifdef ARCH_AARCH64
|
||||
uint8x16_t tbl_h[4], tbl_l[4];
|
||||
#else
|
||||
uint8x8x2_t tbl_h[4], tbl_l[4];
|
||||
#endif
|
||||
for (i = 0; i < 4; i++) {
|
||||
#ifdef ARCH_AARCH64
|
||||
tbl_l[i] = vld1q_u8(tbl + i*16);
|
||||
tbl_h[i] = vld1q_u8(high + i*16);
|
||||
#else
|
||||
tbl_l[i].val[0] = vld1_u8(tbl + i*16);
|
||||
tbl_l[i].val[1] = vld1_u8(tbl + i*16 + 8);
|
||||
tbl_h[i].val[0] = vld1_u8(high + i*16);
|
||||
tbl_h[i].val[1] = vld1_u8(high + i*16 + 8);
|
||||
#endif
|
||||
}
|
||||
|
||||
loset = vdupq_n_u8(0xf);
|
||||
|
||||
while (dst < d_end) {
|
||||
vh = vld1q_u8(src);
|
||||
vl = vld1q_u8(src + 16);
|
||||
|
||||
rl = vqtbl1q_u8(tbl_l[0], vandq_u8(vl, loset));
|
||||
rh = vqtbl1q_u8(tbl_h[0], vandq_u8(vl, loset));
|
||||
rl = veorq_u8(rl, vqtbl1q_u8(tbl_l[2], vandq_u8(vh, loset)));
|
||||
rh = veorq_u8(rh, vqtbl1q_u8(tbl_h[2], vandq_u8(vh, loset)));
|
||||
|
||||
vl = vshrq_n_u8(vl, 4);
|
||||
vh = vshrq_n_u8(vh, 4);
|
||||
|
||||
rl = veorq_u8(rl, vqtbl1q_u8(tbl_l[1], vl));
|
||||
rh = veorq_u8(rh, vqtbl1q_u8(tbl_h[1], vl));
|
||||
rl = veorq_u8(rl, vqtbl1q_u8(tbl_l[3], vh));
|
||||
rh = veorq_u8(rh, vqtbl1q_u8(tbl_h[3], vh));
|
||||
|
||||
if (xor) {
|
||||
vh = vld1q_u8(dst);
|
||||
vl = vld1q_u8(dst + 16);
|
||||
rh = veorq_u8(rh, vh);
|
||||
rl = veorq_u8(rl, vl);
|
||||
}
|
||||
vst1q_u8(dst, rh);
|
||||
vst1q_u8(dst + 16, rl);
|
||||
|
||||
src += 32;
|
||||
dst += 32;
|
||||
}
|
||||
}
|
||||
|
||||
|
||||
|
||||
static
|
||||
inline
|
||||
void
|
||||
neon_w16_split_4_16_lazy_multiply_region(gf_t *gf, void *src, void *dest,
|
||||
gf_val_32_t val, int bytes, int xor,
|
||||
int altmap)
|
||||
{
|
||||
gf_region_data rd;
|
||||
unsigned i, j;
|
||||
uint64_t c, prod;
|
||||
uint8_t tbl[2 * 4 * 16];
|
||||
uint8_t *high = tbl + 4 * 16;
|
||||
|
||||
if (val == 0) { gf_multby_zero(dest, bytes, xor); return; }
|
||||
if (val == 1) { gf_multby_one(src, dest, bytes, xor); return; }
|
||||
|
||||
for (i = 0; i < 4; i++) {
|
||||
for (j = 0; j < 16; j++) {
|
||||
c = (j << (i*4));
|
||||
prod = gf->multiply.w32(gf, c, val);
|
||||
tbl[i*16 + j] = prod & 0xff;
|
||||
high[i*16 + j] = prod >> 8;
|
||||
}
|
||||
}
|
||||
|
||||
gf_set_region_data(&rd, gf, src, dest, bytes, val, xor, 32);
|
||||
gf_do_initial_region_alignment(&rd);
|
||||
|
||||
if (altmap) {
|
||||
uint8_t *s8 = rd.s_start;
|
||||
uint8_t *d8 = rd.d_start;
|
||||
uint8_t *end8 = rd.d_top;
|
||||
if (xor)
|
||||
neon_w16_split_4_altmap_multiply_region(gf, s8, d8, end8, tbl, val, 1);
|
||||
else
|
||||
neon_w16_split_4_altmap_multiply_region(gf, s8, d8, end8, tbl, val, 0);
|
||||
} else {
|
||||
uint16_t *s16 = rd.s_start;
|
||||
uint16_t *d16 = rd.d_start;
|
||||
uint16_t *end16 = rd.d_top;
|
||||
if (xor)
|
||||
neon_w16_split_4_multiply_region(gf, s16, d16, end16, tbl, val, 1);
|
||||
else
|
||||
neon_w16_split_4_multiply_region(gf, s16, d16, end16, tbl, val, 0);
|
||||
}
|
||||
|
||||
gf_do_final_region_alignment(&rd);
|
||||
}
|
||||
|
||||
static
|
||||
void
|
||||
gf_w16_split_4_16_lazy_multiply_region_neon(gf_t *gf, void *src, void *dest,
|
||||
gf_val_32_t val, int bytes, int xor)
|
||||
{
|
||||
neon_w16_split_4_16_lazy_multiply_region(gf, src, dest, val, bytes, xor, 0);
|
||||
}
|
||||
|
||||
static
|
||||
void
|
||||
gf_w16_split_4_16_lazy_altmap_multiply_region_neon(gf_t *gf, void *src,
|
||||
void *dest,
|
||||
gf_val_32_t val, int bytes,
|
||||
int xor)
|
||||
{
|
||||
neon_w16_split_4_16_lazy_multiply_region(gf, src, dest, val, bytes, xor, 1);
|
||||
}
|
||||
|
||||
|
||||
void gf_w16_neon_split_init(gf_t *gf)
|
||||
{
|
||||
gf_internal_t *h = (gf_internal_t *) gf->scratch;
|
||||
|
||||
if (h->region_type & GF_REGION_ALTMAP)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_split_4_16_lazy_altmap_multiply_region_neon)
|
||||
else
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w16_split_4_16_lazy_multiply_region_neon)
|
||||
}
|
|
@ -0,0 +1,269 @@
|
|||
/*
|
||||
* GF-Complete: A Comprehensive Open Source Library for Galois Field Arithmetic
|
||||
* James S. Plank, Ethan L. Miller, Kevin M. Greenan,
|
||||
* Benjamin A. Arnold, John A. Burnum, Adam W. Disney, Allen C. McBride.
|
||||
*
|
||||
* Copyright (c) 2014: Janne Grunau <j@jannau.net>
|
||||
*
|
||||
* Redistribution and use in source and binary forms, with or without
|
||||
* modification, are permitted provided that the following conditions
|
||||
* are met:
|
||||
*
|
||||
* - Redistributions of source code must retain the above copyright
|
||||
* notice, this list of conditions and the following disclaimer.
|
||||
*
|
||||
* - Redistributions in binary form must reproduce the above copyright
|
||||
* notice, this list of conditions and the following disclaimer in
|
||||
* the documentation and/or other materials provided with the
|
||||
* distribution.
|
||||
*
|
||||
* - Neither the name of the University of Tennessee nor the names of its
|
||||
* contributors may be used to endorse or promote products derived
|
||||
* from this software without specific prior written permission.
|
||||
*
|
||||
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
||||
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
||||
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
||||
* A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
|
||||
* HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
|
||||
* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
|
||||
* BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS
|
||||
* OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
|
||||
* AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
|
||||
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY
|
||||
* WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
||||
* POSSIBILITY OF SUCH DAMAGE.
|
||||
*
|
||||
* gf_w32_neon.c
|
||||
*
|
||||
* Neon routines for 32-bit Galois fields
|
||||
*
|
||||
*/
|
||||
|
||||
|
||||
#include "gf_int.h"
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
#include "gf_w32.h"
|
||||
|
||||
#ifndef ARCH_AARCH64
|
||||
#define vqtbl1q_u8(tbl, v) vcombine_u8(vtbl2_u8(tbl, vget_low_u8(v)), \
|
||||
vtbl2_u8(tbl, vget_high_u8(v)))
|
||||
#endif
|
||||
|
||||
static
|
||||
void
|
||||
neon_w32_split_4_32_multiply_region(gf_t *gf, uint32_t *src, uint32_t *dst,
|
||||
uint32_t *d_end, uint8_t btable[8][4][16],
|
||||
uint32_t val, int xor, int altmap)
|
||||
{
|
||||
int i, j;
|
||||
#ifdef ARCH_AARCH64
|
||||
uint8x16_t tables[8][4];
|
||||
#else
|
||||
uint8x8x2_t tables[8][4];
|
||||
#endif
|
||||
uint32x4_t v0, v1, v2, v3, s0, s1, s2, s3;
|
||||
uint8x16_t p0, p1, p2, p3, si, mask1;
|
||||
uint16x8x2_t r0, r1;
|
||||
uint8x16x2_t q0, q1;
|
||||
|
||||
for (i = 0; i < 8; i++) {
|
||||
for (j = 0; j < 4; j++) {
|
||||
#ifdef ARCH_AARCH64
|
||||
tables[i][j] = vld1q_u8(btable[i][j]);
|
||||
#else
|
||||
tables[i][j].val[0] = vld1_u8(btable[i][j]);
|
||||
tables[i][j].val[1] = vld1_u8(btable[i][j] + 8);
|
||||
#endif
|
||||
}
|
||||
}
|
||||
|
||||
mask1 = vdupq_n_u8(0xf);
|
||||
|
||||
while (dst < d_end) {
|
||||
|
||||
v0 = vld1q_u32(src); src += 4;
|
||||
v1 = vld1q_u32(src); src += 4;
|
||||
v2 = vld1q_u32(src); src += 4;
|
||||
v3 = vld1q_u32(src); src += 4;
|
||||
|
||||
if (altmap) {
|
||||
q0.val[0] = vreinterpretq_u8_u32(v0);
|
||||
q0.val[1] = vreinterpretq_u8_u32(v1);
|
||||
q1.val[0] = vreinterpretq_u8_u32(v2);
|
||||
q1.val[1] = vreinterpretq_u8_u32(v3);
|
||||
} else {
|
||||
r0 = vtrnq_u16(vreinterpretq_u16_u32(v0), vreinterpretq_u16_u32(v2));
|
||||
r1 = vtrnq_u16(vreinterpretq_u16_u32(v1), vreinterpretq_u16_u32(v3));
|
||||
|
||||
q0 = vtrnq_u8(vreinterpretq_u8_u16(r0.val[0]),
|
||||
vreinterpretq_u8_u16(r1.val[0]));
|
||||
q1 = vtrnq_u8(vreinterpretq_u8_u16(r0.val[1]),
|
||||
vreinterpretq_u8_u16(r1.val[1]));
|
||||
}
|
||||
|
||||
si = vandq_u8(q0.val[0], mask1);
|
||||
p0 = vqtbl1q_u8(tables[0][0], si);
|
||||
p1 = vqtbl1q_u8(tables[0][1], si);
|
||||
p2 = vqtbl1q_u8(tables[0][2], si);
|
||||
p3 = vqtbl1q_u8(tables[0][3], si);
|
||||
|
||||
si = vshrq_n_u8(q0.val[0], 4);
|
||||
p0 = veorq_u8(p0, vqtbl1q_u8(tables[1][0], si));
|
||||
p1 = veorq_u8(p1, vqtbl1q_u8(tables[1][1], si));
|
||||
p2 = veorq_u8(p2, vqtbl1q_u8(tables[1][2], si));
|
||||
p3 = veorq_u8(p3, vqtbl1q_u8(tables[1][3], si));
|
||||
|
||||
si = vandq_u8(q0.val[1], mask1);
|
||||
p0 = veorq_u8(p0, vqtbl1q_u8(tables[2][0], si));
|
||||
p1 = veorq_u8(p1, vqtbl1q_u8(tables[2][1], si));
|
||||
p2 = veorq_u8(p2, vqtbl1q_u8(tables[2][2], si));
|
||||
p3 = veorq_u8(p3, vqtbl1q_u8(tables[2][3], si));
|
||||
|
||||
si = vshrq_n_u8(q0.val[1], 4);
|
||||
p0 = veorq_u8(p0, vqtbl1q_u8(tables[3][0], si));
|
||||
p1 = veorq_u8(p1, vqtbl1q_u8(tables[3][1], si));
|
||||
p2 = veorq_u8(p2, vqtbl1q_u8(tables[3][2], si));
|
||||
p3 = veorq_u8(p3, vqtbl1q_u8(tables[3][3], si));
|
||||
|
||||
si = vandq_u8(q1.val[0], mask1);
|
||||
p0 = veorq_u8(p0, vqtbl1q_u8(tables[4][0], si));
|
||||
p1 = veorq_u8(p1, vqtbl1q_u8(tables[4][1], si));
|
||||
p2 = veorq_u8(p2, vqtbl1q_u8(tables[4][2], si));
|
||||
p3 = veorq_u8(p3, vqtbl1q_u8(tables[4][3], si));
|
||||
|
||||
si = vshrq_n_u8(q1.val[0], 4);
|
||||
p0 = veorq_u8(p0, vqtbl1q_u8(tables[5][0], si));
|
||||
p1 = veorq_u8(p1, vqtbl1q_u8(tables[5][1], si));
|
||||
p2 = veorq_u8(p2, vqtbl1q_u8(tables[5][2], si));
|
||||
p3 = veorq_u8(p3, vqtbl1q_u8(tables[5][3], si));
|
||||
|
||||
si = vandq_u8(q1.val[1], mask1);
|
||||
p0 = veorq_u8(p0, vqtbl1q_u8(tables[6][0], si));
|
||||
p1 = veorq_u8(p1, vqtbl1q_u8(tables[6][1], si));
|
||||
p2 = veorq_u8(p2, vqtbl1q_u8(tables[6][2], si));
|
||||
p3 = veorq_u8(p3, vqtbl1q_u8(tables[6][3], si));
|
||||
|
||||
si = vshrq_n_u8(q1.val[1], 4);
|
||||
p0 = veorq_u8(p0, vqtbl1q_u8(tables[7][0], si));
|
||||
p1 = veorq_u8(p1, vqtbl1q_u8(tables[7][1], si));
|
||||
p2 = veorq_u8(p2, vqtbl1q_u8(tables[7][2], si));
|
||||
p3 = veorq_u8(p3, vqtbl1q_u8(tables[7][3], si));
|
||||
|
||||
if (altmap) {
|
||||
s0 = vreinterpretq_u32_u8(p0);
|
||||
s1 = vreinterpretq_u32_u8(p1);
|
||||
s2 = vreinterpretq_u32_u8(p2);
|
||||
s3 = vreinterpretq_u32_u8(p3);
|
||||
} else {
|
||||
q0 = vtrnq_u8(p0, p1);
|
||||
q1 = vtrnq_u8(p2, p3);
|
||||
|
||||
r0 = vtrnq_u16(vreinterpretq_u16_u8(q0.val[0]),
|
||||
vreinterpretq_u16_u8(q1.val[0]));
|
||||
r1 = vtrnq_u16(vreinterpretq_u16_u8(q0.val[1]),
|
||||
vreinterpretq_u16_u8(q1.val[1]));
|
||||
|
||||
s0 = vreinterpretq_u32_u16(r0.val[0]);
|
||||
s1 = vreinterpretq_u32_u16(r1.val[0]);
|
||||
s2 = vreinterpretq_u32_u16(r0.val[1]);
|
||||
s3 = vreinterpretq_u32_u16(r1.val[1]);
|
||||
}
|
||||
|
||||
if (xor) {
|
||||
v0 = vld1q_u32(dst);
|
||||
v1 = vld1q_u32(dst + 4);
|
||||
v2 = vld1q_u32(dst + 8);
|
||||
v3 = vld1q_u32(dst + 12);
|
||||
s0 = veorq_u32(s0, v0);
|
||||
s1 = veorq_u32(s1, v1);
|
||||
s2 = veorq_u32(s2, v2);
|
||||
s3 = veorq_u32(s3, v3);
|
||||
}
|
||||
|
||||
vst1q_u32(dst, s0);
|
||||
vst1q_u32(dst + 4, s1);
|
||||
vst1q_u32(dst + 8, s2);
|
||||
vst1q_u32(dst + 12, s3);
|
||||
|
||||
dst += 16;
|
||||
}
|
||||
}
|
||||
|
||||
static
|
||||
inline
|
||||
void
|
||||
neon_w32_split_4_32_lazy_multiply_region(gf_t *gf, void *src, void *dest, uint32_t val, int bytes, int xor, int altmap)
|
||||
{
|
||||
gf_internal_t *h;
|
||||
int i, j, k;
|
||||
uint32_t pp, v, *s32, *d32, *top, tmp_table[16];
|
||||
uint8_t btable[8][4][16];
|
||||
gf_region_data rd;
|
||||
|
||||
if (val == 0) { gf_multby_zero(dest, bytes, xor); return; }
|
||||
if (val == 1) { gf_multby_one(src, dest, bytes, xor); return; }
|
||||
|
||||
h = (gf_internal_t *) gf->scratch;
|
||||
pp = h->prim_poly;
|
||||
|
||||
gf_set_region_data(&rd, gf, src, dest, bytes, val, xor, 64);
|
||||
gf_do_initial_region_alignment(&rd);
|
||||
|
||||
s32 = (uint32_t *) rd.s_start;
|
||||
d32 = (uint32_t *) rd.d_start;
|
||||
top = (uint32_t *) rd.d_top;
|
||||
|
||||
v = val;
|
||||
for (i = 0; i < 8; i++) {
|
||||
tmp_table[0] = 0;
|
||||
for (j = 1; j < 16; j <<= 1) {
|
||||
for (k = 0; k < j; k++) {
|
||||
tmp_table[k^j] = (v ^ tmp_table[k]);
|
||||
}
|
||||
v = (v & GF_FIRST_BIT) ? ((v << 1) ^ pp) : (v << 1);
|
||||
}
|
||||
for (j = 0; j < 4; j++) {
|
||||
for (k = 0; k < 16; k++) {
|
||||
btable[i][j][k] = (uint8_t) tmp_table[k];
|
||||
tmp_table[k] >>= 8;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
if (xor)
|
||||
neon_w32_split_4_32_multiply_region(gf, s32, d32, top, btable, val, 1, altmap);
|
||||
else
|
||||
neon_w32_split_4_32_multiply_region(gf, s32, d32, top, btable, val, 0, altmap);
|
||||
|
||||
gf_do_final_region_alignment(&rd);
|
||||
}
|
||||
|
||||
static
|
||||
void
|
||||
gf_w32_split_4_32_lazy_multiply_region_neon(gf_t *gf, void *src, void *dest,
|
||||
gf_val_32_t val, int bytes, int xor)
|
||||
{
|
||||
neon_w32_split_4_32_lazy_multiply_region(gf, src, dest, val, bytes, xor, 0);
|
||||
}
|
||||
|
||||
static
|
||||
void
|
||||
gf_w32_split_4_32_lazy_altmap_multiply_region_neon(gf_t *gf, void *src,
|
||||
void *dest, gf_val_32_t val,
|
||||
int bytes, int xor)
|
||||
{
|
||||
neon_w32_split_4_32_lazy_multiply_region(gf, src, dest, val, bytes, xor, 1);
|
||||
}
|
||||
|
||||
void gf_w32_neon_split_init(gf_t *gf)
|
||||
{
|
||||
gf_internal_t *h = (gf_internal_t *) gf->scratch;
|
||||
|
||||
if (h->region_type & GF_REGION_ALTMAP)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_split_4_32_lazy_altmap_multiply_region_neon)
|
||||
else
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w32_split_4_32_lazy_multiply_region_neon)
|
||||
|
||||
}
|
|
@ -0,0 +1,247 @@
|
|||
/*
|
||||
* GF-Complete: A Comprehensive Open Source Library for Galois Field Arithmetic
|
||||
* James S. Plank, Ethan L. Miller, Kevin M. Greenan,
|
||||
* Benjamin A. Arnold, John A. Burnum, Adam W. Disney, Allen C. McBride.
|
||||
*
|
||||
* Copyright (c) 2014: Janne Grunau <j@jannau.net>
|
||||
*
|
||||
* Redistribution and use in source and binary forms, with or without
|
||||
* modification, are permitted provided that the following conditions
|
||||
* are met:
|
||||
*
|
||||
* - Redistributions of source code must retain the above copyright
|
||||
* notice, this list of conditions and the following disclaimer.
|
||||
*
|
||||
* - Redistributions in binary form must reproduce the above copyright
|
||||
* notice, this list of conditions and the following disclaimer in
|
||||
* the documentation and/or other materials provided with the
|
||||
* distribution.
|
||||
*
|
||||
* - Neither the name of the University of Tennessee nor the names of its
|
||||
* contributors may be used to endorse or promote products derived
|
||||
* from this software without specific prior written permission.
|
||||
*
|
||||
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
||||
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
||||
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
||||
* A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
|
||||
* HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
|
||||
* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
|
||||
* BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS
|
||||
* OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
|
||||
* AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
|
||||
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY
|
||||
* WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
||||
* POSSIBILITY OF SUCH DAMAGE.
|
||||
*
|
||||
* gf_w4_neon.c
|
||||
*
|
||||
* Neon routines for 4-bit Galois fields
|
||||
*
|
||||
*/
|
||||
|
||||
#include "gf_int.h"
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
#include "gf_w4.h"
|
||||
|
||||
static
|
||||
gf_val_32_t
|
||||
gf_w4_neon_clm_multiply (gf_t *gf, gf_val_32_t a4, gf_val_32_t b4)
|
||||
{
|
||||
gf_val_32_t rv = 0;
|
||||
poly8x8_t result, prim_poly;
|
||||
poly8x8_t a, b, w;
|
||||
uint8x8_t v;
|
||||
gf_internal_t * h = gf->scratch;
|
||||
|
||||
a = vdup_n_p8 (a4);
|
||||
b = vdup_n_p8 (b4);
|
||||
|
||||
prim_poly = vdup_n_p8 ((uint32_t)(h->prim_poly & 0x1fULL));
|
||||
|
||||
/* Do the initial multiply */
|
||||
result = vmul_p8 (a, b);
|
||||
v = vshr_n_u8 (vreinterpret_u8_p8(result), 4);
|
||||
w = vmul_p8 (prim_poly, vreinterpret_p8_u8(v));
|
||||
result = vreinterpret_p8_u8 (veor_u8 (vreinterpret_u8_p8(result), vreinterpret_u8_p8(w)));
|
||||
|
||||
/* Extracts 32 bit value from result. */
|
||||
rv = (gf_val_32_t)vget_lane_u8 (vreinterpret_u8_p8 (result), 0);
|
||||
|
||||
return rv;
|
||||
}
|
||||
|
||||
static inline void
|
||||
neon_clm_multiply_region_from_single (gf_t *gf, uint8_t *s8, uint8_t *d8,
|
||||
gf_val_32_t val, uint8_t *d_end, int xor)
|
||||
{
|
||||
gf_internal_t * h = gf->scratch;
|
||||
poly8x8_t prim_poly;
|
||||
poly8x8_t a, w, even, odd;
|
||||
uint8x8_t b, c, v, mask;
|
||||
|
||||
a = vdup_n_p8 (val);
|
||||
mask = vdup_n_u8 (0xf);
|
||||
prim_poly = vdup_n_p8 ((uint8_t)(h->prim_poly & 0x1fULL));
|
||||
|
||||
while (d8 < d_end) {
|
||||
b = vld1_u8 (s8);
|
||||
|
||||
even = vreinterpret_p8_u8 (vand_u8 (b, mask));
|
||||
odd = vreinterpret_p8_u8 (vshr_n_u8 (b, 4));
|
||||
|
||||
if (xor)
|
||||
c = vld1_u8 (d8);
|
||||
|
||||
even = vmul_p8 (a, even);
|
||||
odd = vmul_p8 (a, odd);
|
||||
|
||||
v = vshr_n_u8 (vreinterpret_u8_p8(even), 4);
|
||||
w = vmul_p8 (prim_poly, vreinterpret_p8_u8(v));
|
||||
even = vreinterpret_p8_u8 (veor_u8 (vreinterpret_u8_p8(even), vreinterpret_u8_p8(w)));
|
||||
|
||||
v = vshr_n_u8 (vreinterpret_u8_p8(odd), 4);
|
||||
w = vmul_p8 (prim_poly, vreinterpret_p8_u8(v));
|
||||
odd = vreinterpret_p8_u8 (veor_u8 (vreinterpret_u8_p8(odd), vreinterpret_u8_p8(w)));
|
||||
|
||||
v = veor_u8 (vreinterpret_u8_p8 (even), vshl_n_u8 (vreinterpret_u8_p8 (odd), 4));
|
||||
|
||||
if (xor)
|
||||
v = veor_u8 (c, v);
|
||||
|
||||
vst1_u8 (d8, v);
|
||||
|
||||
d8 += 8;
|
||||
s8 += 8;
|
||||
}
|
||||
}
|
||||
|
||||
|
||||
static void
|
||||
gf_w4_neon_clm_multiply_region_from_single (gf_t *gf, void *src, void *dest,
|
||||
gf_val_32_t val, int bytes, int xor)
|
||||
{
|
||||
gf_region_data rd;
|
||||
uint8_t *s8;
|
||||
uint8_t *d8;
|
||||
|
||||
if (val == 0) { gf_multby_zero(dest, bytes, xor); return; }
|
||||
if (val == 1) { gf_multby_one(src, dest, bytes, xor); return; }
|
||||
|
||||
gf_set_region_data(&rd, gf, src, dest, bytes, val, xor, 16);
|
||||
gf_do_initial_region_alignment(&rd);
|
||||
|
||||
s8 = (uint8_t *) rd.s_start;
|
||||
d8 = (uint8_t *) rd.d_start;
|
||||
|
||||
if (xor)
|
||||
neon_clm_multiply_region_from_single (gf, s8, d8, val, rd.d_top, 1);
|
||||
else
|
||||
neon_clm_multiply_region_from_single (gf, s8, d8, val, rd.d_top, 0);
|
||||
|
||||
gf_do_final_region_alignment(&rd);
|
||||
}
|
||||
|
||||
#ifndef ARCH_AARCH64
|
||||
#define vqtbl1q_u8(tbl, v) vcombine_u8(vtbl2_u8(tbl, vget_low_u8(v)), \
|
||||
vtbl2_u8(tbl, vget_high_u8(v)))
|
||||
#endif
|
||||
|
||||
static
|
||||
inline
|
||||
void
|
||||
w4_single_table_multiply_region_neon(gf_t *gf, uint8_t *src, uint8_t *dst,
|
||||
uint8_t * d_end, gf_val_32_t val, int xor)
|
||||
{
|
||||
struct gf_single_table_data *std;
|
||||
uint8_t *base;
|
||||
uint8x16_t r, va, vh, vl, loset;
|
||||
|
||||
#ifdef ARCH_AARCH64
|
||||
uint8x16_t th, tl;
|
||||
#else
|
||||
uint8x8x2_t th, tl;
|
||||
#endif
|
||||
|
||||
std = (struct gf_single_table_data *) ((gf_internal_t *) (gf->scratch))->private;
|
||||
base = (uint8_t *) std->mult;
|
||||
base += (val << GF_FIELD_WIDTH);
|
||||
|
||||
#ifdef ARCH_AARCH64
|
||||
tl = vld1q_u8 (base);
|
||||
th = vshlq_n_u8 (tl, 4);
|
||||
#else
|
||||
tl.val[0] = vld1_u8 (base);
|
||||
tl.val[1] = vld1_u8 (base + 8);
|
||||
th.val[0] = vshl_n_u8 (tl.val[0], 4);
|
||||
th.val[1] = vshl_n_u8 (tl.val[1], 4);
|
||||
#endif
|
||||
|
||||
loset = vdupq_n_u8(0xf);
|
||||
|
||||
while (dst < d_end) {
|
||||
va = vld1q_u8 (src);
|
||||
|
||||
vh = vshrq_n_u8 (va, 4);
|
||||
vl = vandq_u8 (va, loset);
|
||||
|
||||
if (xor)
|
||||
va = vld1q_u8 (dst);
|
||||
|
||||
vh = vqtbl1q_u8 (th, vh);
|
||||
vl = vqtbl1q_u8 (tl, vl);
|
||||
|
||||
r = veorq_u8 (vh, vl);
|
||||
|
||||
if (xor)
|
||||
r = veorq_u8 (va, r);
|
||||
|
||||
vst1q_u8 (dst, r);
|
||||
|
||||
dst += 16;
|
||||
src += 16;
|
||||
}
|
||||
}
|
||||
|
||||
static
|
||||
void
|
||||
gf_w4_single_table_multiply_region_neon(gf_t *gf, void *src, void *dest,
|
||||
gf_val_32_t val, int bytes, int xor)
|
||||
{
|
||||
gf_region_data rd;
|
||||
uint8_t *sptr, *dptr, *top;
|
||||
|
||||
if (val == 0) { gf_multby_zero(dest, bytes, xor); return; }
|
||||
if (val == 1) { gf_multby_one(src, dest, bytes, xor); return; }
|
||||
|
||||
gf_set_region_data(&rd, gf, src, dest, bytes, val, xor, 16);
|
||||
gf_do_initial_region_alignment(&rd);
|
||||
|
||||
sptr = rd.s_start;
|
||||
dptr = rd.d_start;
|
||||
top = rd.d_top;
|
||||
|
||||
if (xor)
|
||||
w4_single_table_multiply_region_neon(gf, sptr, dptr, top, val, 1);
|
||||
else
|
||||
w4_single_table_multiply_region_neon(gf, sptr, dptr, top, val, 0);
|
||||
|
||||
gf_do_final_region_alignment(&rd);
|
||||
|
||||
}
|
||||
|
||||
|
||||
int gf_w4_neon_cfm_init(gf_t *gf)
|
||||
{
|
||||
// single clm multiplication probably pointless
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w4_neon_clm_multiply)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w4_neon_clm_multiply_region_from_single)
|
||||
|
||||
return 1;
|
||||
}
|
||||
|
||||
void gf_w4_neon_single_table_init(gf_t *gf)
|
||||
{
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w4_single_table_multiply_region_neon)
|
||||
}
|
|
@ -0,0 +1,333 @@
|
|||
/*
|
||||
* GF-Complete: A Comprehensive Open Source Library for Galois Field Arithmetic
|
||||
* James S. Plank, Ethan L. Miller, Kevin M. Greenan,
|
||||
* Benjamin A. Arnold, John A. Burnum, Adam W. Disney, Allen C. McBride.
|
||||
*
|
||||
* Copyright (c) 2014: Janne Grunau <j@jannau.net>
|
||||
*
|
||||
* Redistribution and use in source and binary forms, with or without
|
||||
* modification, are permitted provided that the following conditions
|
||||
* are met:
|
||||
*
|
||||
* - Redistributions of source code must retain the above copyright
|
||||
* notice, this list of conditions and the following disclaimer.
|
||||
*
|
||||
* - Redistributions in binary form must reproduce the above copyright
|
||||
* notice, this list of conditions and the following disclaimer in
|
||||
* the documentation and/or other materials provided with the
|
||||
* distribution.
|
||||
*
|
||||
* - Neither the name of the University of Tennessee nor the names of its
|
||||
* contributors may be used to endorse or promote products derived
|
||||
* from this software without specific prior written permission.
|
||||
*
|
||||
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
||||
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
||||
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
||||
* A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
|
||||
* HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
|
||||
* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
|
||||
* BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS
|
||||
* OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
|
||||
* AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
|
||||
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY
|
||||
* WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
||||
* POSSIBILITY OF SUCH DAMAGE.
|
||||
*
|
||||
* gf_w64_neon.c
|
||||
*
|
||||
* Neon routines for 64-bit Galois fields
|
||||
*
|
||||
*/
|
||||
|
||||
#include "gf_int.h"
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
#include "gf_w64.h"
|
||||
|
||||
|
||||
#ifndef ARCH_AARCH64
|
||||
#define vqtbl1q_u8(tbl, v) vcombine_u8(vtbl2_u8(tbl, vget_low_u8(v)), \
|
||||
vtbl2_u8(tbl, vget_high_u8(v)))
|
||||
#endif
|
||||
|
||||
static
|
||||
inline
|
||||
void
|
||||
neon_w64_split_4_lazy_altmap_multiply_region(gf_t *gf, uint64_t *src,
|
||||
uint64_t *dst, uint64_t *d_end,
|
||||
uint64_t val, int xor)
|
||||
{
|
||||
unsigned i, j, k;
|
||||
uint8_t btable[16];
|
||||
#ifdef ARCH_AARCH64
|
||||
uint8x16_t tables[16][8];
|
||||
#else
|
||||
uint8x8x2_t tables[16][8];
|
||||
#endif
|
||||
uint8x16_t p[8], mask1, si;
|
||||
|
||||
gf_internal_t *h = (gf_internal_t *) gf->scratch;
|
||||
struct gf_split_4_64_lazy_data *ld = (struct gf_split_4_64_lazy_data *) h->private;
|
||||
|
||||
for (i = 0; i < 16; i++) {
|
||||
for (j = 0; j < 8; j++) {
|
||||
for (k = 0; k < 16; k++) {
|
||||
btable[k] = (uint8_t) ld->tables[i][k];
|
||||
ld->tables[i][k] >>= 8;
|
||||
}
|
||||
#ifdef ARCH_AARCH64
|
||||
tables[i][j] = vld1q_u8(btable);
|
||||
#else
|
||||
tables[i][j].val[0] = vld1_u8(btable);
|
||||
tables[i][j].val[1] = vld1_u8(btable + 8);
|
||||
#endif
|
||||
}
|
||||
}
|
||||
|
||||
mask1 = vdupq_n_u8(0xf);
|
||||
|
||||
while (dst < d_end) {
|
||||
|
||||
if (xor) {
|
||||
for (i = 0; i < 8; i++)
|
||||
p[i] = vld1q_u8((uint8_t *) (dst + i * 2));
|
||||
} else {
|
||||
for (i = 0; i < 8; i++)
|
||||
p[i] = vdupq_n_u8(0);
|
||||
}
|
||||
|
||||
i = 0;
|
||||
for (k = 0; k < 8; k++) {
|
||||
uint8x16_t v0 = vld1q_u8((uint8_t *) src);
|
||||
src += 2;
|
||||
|
||||
si = vandq_u8(v0, mask1);
|
||||
for (j = 0; j < 8; j++) {
|
||||
p[j] = veorq_u8(p[j], vqtbl1q_u8(tables[i][j], si));
|
||||
}
|
||||
i++;
|
||||
si = vshrq_n_u8(v0, 4);
|
||||
for (j = 0; j < 8; j++) {
|
||||
p[j] = veorq_u8(p[j], vqtbl1q_u8(tables[i][j], si));
|
||||
}
|
||||
i++;
|
||||
|
||||
}
|
||||
for (i = 0; i < 8; i++) {
|
||||
vst1q_u8((uint8_t *) dst, p[i]);
|
||||
dst += 2;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
static
|
||||
inline
|
||||
void
|
||||
neon_w64_split_4_lazy_multiply_region(gf_t *gf, uint64_t *src, uint64_t *dst,
|
||||
uint64_t *d_end, uint64_t val, int xor)
|
||||
{
|
||||
unsigned i, j, k;
|
||||
uint8_t btable[16];
|
||||
#ifdef ARCH_AARCH64
|
||||
uint8x16_t tables[16][8];
|
||||
#else
|
||||
uint8x8x2_t tables[16][8];
|
||||
#endif
|
||||
uint8x16_t p[8], mask1, si;
|
||||
uint64x2_t st[8];
|
||||
uint32x4x2_t s32[4];
|
||||
uint16x8x2_t s16[4];
|
||||
uint8x16x2_t s8[4];
|
||||
|
||||
gf_internal_t *h = (gf_internal_t *) gf->scratch;
|
||||
struct gf_split_4_64_lazy_data *ld = (struct gf_split_4_64_lazy_data *) h->private;
|
||||
|
||||
for (i = 0; i < 16; i++) {
|
||||
for (j = 0; j < 8; j++) {
|
||||
for (k = 0; k < 16; k++) {
|
||||
btable[k] = (uint8_t) ld->tables[i][k];
|
||||
ld->tables[i][k] >>= 8;
|
||||
}
|
||||
#ifdef ARCH_AARCH64
|
||||
tables[i][j] = vld1q_u8(btable);
|
||||
#else
|
||||
tables[i][j].val[0] = vld1_u8(btable);
|
||||
tables[i][j].val[1] = vld1_u8(btable + 8);
|
||||
#endif
|
||||
}
|
||||
}
|
||||
|
||||
mask1 = vdupq_n_u8(0xf);
|
||||
|
||||
while (dst < d_end) {
|
||||
|
||||
for (k = 0; k < 8; k++) {
|
||||
st[k] = vld1q_u64(src);
|
||||
src += 2;
|
||||
p[k] = vdupq_n_u8(0);
|
||||
}
|
||||
|
||||
s32[0] = vuzpq_u32(vreinterpretq_u32_u64(st[0]),
|
||||
vreinterpretq_u32_u64(st[1]));
|
||||
s32[1] = vuzpq_u32(vreinterpretq_u32_u64(st[2]),
|
||||
vreinterpretq_u32_u64(st[3]));
|
||||
s32[2] = vuzpq_u32(vreinterpretq_u32_u64(st[4]),
|
||||
vreinterpretq_u32_u64(st[5]));
|
||||
s32[3] = vuzpq_u32(vreinterpretq_u32_u64(st[6]),
|
||||
vreinterpretq_u32_u64(st[7]));
|
||||
|
||||
s16[0] = vuzpq_u16(vreinterpretq_u16_u32(s32[0].val[0]),
|
||||
vreinterpretq_u16_u32(s32[1].val[0]));
|
||||
s16[1] = vuzpq_u16(vreinterpretq_u16_u32(s32[2].val[0]),
|
||||
vreinterpretq_u16_u32(s32[3].val[0]));
|
||||
s16[2] = vuzpq_u16(vreinterpretq_u16_u32(s32[0].val[1]),
|
||||
vreinterpretq_u16_u32(s32[1].val[1]));
|
||||
s16[3] = vuzpq_u16(vreinterpretq_u16_u32(s32[2].val[1]),
|
||||
vreinterpretq_u16_u32(s32[3].val[1]));
|
||||
|
||||
s8[0] = vuzpq_u8(vreinterpretq_u8_u16(s16[0].val[0]),
|
||||
vreinterpretq_u8_u16(s16[1].val[0]));
|
||||
s8[1] = vuzpq_u8(vreinterpretq_u8_u16(s16[0].val[1]),
|
||||
vreinterpretq_u8_u16(s16[1].val[1]));
|
||||
s8[2] = vuzpq_u8(vreinterpretq_u8_u16(s16[2].val[0]),
|
||||
vreinterpretq_u8_u16(s16[3].val[0]));
|
||||
s8[3] = vuzpq_u8(vreinterpretq_u8_u16(s16[2].val[1]),
|
||||
vreinterpretq_u8_u16(s16[3].val[1]));
|
||||
|
||||
i = 0;
|
||||
for (k = 0; k < 8; k++) {
|
||||
si = vandq_u8(s8[k >> 1].val[k & 1], mask1);
|
||||
for (j = 0; j < 8; j++) {
|
||||
p[j] = veorq_u8(p[j], vqtbl1q_u8(tables[i][j], si));
|
||||
}
|
||||
i++;
|
||||
si = vshrq_n_u8(s8[k >> 1].val[k & 1], 4);
|
||||
for (j = 0; j < 8; j++) {
|
||||
p[j] = veorq_u8(p[j], vqtbl1q_u8(tables[i][j], si));
|
||||
}
|
||||
i++;
|
||||
}
|
||||
|
||||
s8[0] = vzipq_u8(p[0], p[1]);
|
||||
s8[1] = vzipq_u8(p[2], p[3]);
|
||||
s8[2] = vzipq_u8(p[4], p[5]);
|
||||
s8[3] = vzipq_u8(p[6], p[7]);
|
||||
|
||||
s16[0] = vzipq_u16(vreinterpretq_u16_u8(s8[0].val[0]),
|
||||
vreinterpretq_u16_u8(s8[1].val[0]));
|
||||
s16[1] = vzipq_u16(vreinterpretq_u16_u8(s8[2].val[0]),
|
||||
vreinterpretq_u16_u8(s8[3].val[0]));
|
||||
s16[2] = vzipq_u16(vreinterpretq_u16_u8(s8[0].val[1]),
|
||||
vreinterpretq_u16_u8(s8[1].val[1]));
|
||||
s16[3] = vzipq_u16(vreinterpretq_u16_u8(s8[2].val[1]),
|
||||
vreinterpretq_u16_u8(s8[3].val[1]));
|
||||
|
||||
s32[0] = vzipq_u32(vreinterpretq_u32_u16(s16[0].val[0]),
|
||||
vreinterpretq_u32_u16(s16[1].val[0]));
|
||||
s32[1] = vzipq_u32(vreinterpretq_u32_u16(s16[0].val[1]),
|
||||
vreinterpretq_u32_u16(s16[1].val[1]));
|
||||
s32[2] = vzipq_u32(vreinterpretq_u32_u16(s16[2].val[0]),
|
||||
vreinterpretq_u32_u16(s16[3].val[0]));
|
||||
s32[3] = vzipq_u32(vreinterpretq_u32_u16(s16[2].val[1]),
|
||||
vreinterpretq_u32_u16(s16[3].val[1]));
|
||||
|
||||
for (k = 0; k < 8; k ++) {
|
||||
st[k] = vreinterpretq_u64_u32(s32[k >> 1].val[k & 1]);
|
||||
}
|
||||
|
||||
if (xor) {
|
||||
for (i = 0; i < 8; i++) {
|
||||
uint64x2_t t1 = vld1q_u64(dst);
|
||||
vst1q_u64(dst, veorq_u64(st[i], t1));
|
||||
dst += 2;
|
||||
}
|
||||
} else {
|
||||
for (i = 0; i < 8; i++) {
|
||||
vst1q_u64(dst, st[i]);
|
||||
dst += 2;
|
||||
}
|
||||
}
|
||||
|
||||
}
|
||||
}
|
||||
|
||||
static
|
||||
void
|
||||
gf_w64_neon_split_4_lazy_multiply_region(gf_t *gf, void *src, void *dest,
|
||||
uint64_t val, int bytes, int xor,
|
||||
int altmap)
|
||||
{
|
||||
gf_internal_t *h;
|
||||
int i, j, k;
|
||||
uint64_t pp, v, *s64, *d64, *top;
|
||||
struct gf_split_4_64_lazy_data *ld;
|
||||
gf_region_data rd;
|
||||
|
||||
if (val == 0) { gf_multby_zero(dest, bytes, xor); return; }
|
||||
if (val == 1) { gf_multby_one(src, dest, bytes, xor); return; }
|
||||
|
||||
gf_set_region_data(&rd, gf, src, dest, bytes, val, xor, 128);
|
||||
gf_do_initial_region_alignment(&rd);
|
||||
|
||||
s64 = (uint64_t *) rd.s_start;
|
||||
d64 = (uint64_t *) rd.d_start;
|
||||
top = (uint64_t *) rd.d_top;
|
||||
|
||||
h = (gf_internal_t *) gf->scratch;
|
||||
pp = h->prim_poly;
|
||||
ld = (struct gf_split_4_64_lazy_data *) h->private;
|
||||
|
||||
v = val;
|
||||
for (i = 0; i < 16; i++) {
|
||||
ld->tables[i][0] = 0;
|
||||
for (j = 1; j < 16; j <<= 1) {
|
||||
for (k = 0; k < j; k++) {
|
||||
ld->tables[i][k^j] = (v ^ ld->tables[i][k]);
|
||||
}
|
||||
v = (v & GF_FIRST_BIT) ? ((v << 1) ^ pp) : (v << 1);
|
||||
}
|
||||
}
|
||||
|
||||
if (altmap) {
|
||||
if (xor)
|
||||
neon_w64_split_4_lazy_altmap_multiply_region(gf, s64, d64, top, val, 1);
|
||||
else
|
||||
neon_w64_split_4_lazy_altmap_multiply_region(gf, s64, d64, top, val, 0);
|
||||
} else {
|
||||
if (xor)
|
||||
neon_w64_split_4_lazy_multiply_region(gf, s64, d64, top, val, 1);
|
||||
else
|
||||
neon_w64_split_4_lazy_multiply_region(gf, s64, d64, top, val, 0);
|
||||
}
|
||||
|
||||
gf_do_final_region_alignment(&rd);
|
||||
}
|
||||
|
||||
static
|
||||
void
|
||||
gf_w64_split_4_64_lazy_multiply_region_neon(gf_t *gf, void *src, void *dest,
|
||||
uint64_t val, int bytes, int xor)
|
||||
{
|
||||
gf_w64_neon_split_4_lazy_multiply_region(gf, src, dest, val, bytes, xor, 0);
|
||||
}
|
||||
|
||||
static
|
||||
void
|
||||
gf_w64_split_4_64_lazy_altmap_multiply_region_neon(gf_t *gf, void *src,
|
||||
void *dest, uint64_t val,
|
||||
int bytes, int xor)
|
||||
{
|
||||
gf_w64_neon_split_4_lazy_multiply_region(gf, src, dest, val, bytes, xor, 1);
|
||||
}
|
||||
|
||||
void gf_w64_neon_split_init(gf_t *gf)
|
||||
{
|
||||
gf_internal_t *h = (gf_internal_t *) gf->scratch;
|
||||
|
||||
if (h->region_type & GF_REGION_ALTMAP)
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_split_4_64_lazy_altmap_multiply_region_neon)
|
||||
else
|
||||
SET_FUNCTION(gf,multiply_region,w64,gf_w64_split_4_64_lazy_multiply_region_neon)
|
||||
|
||||
}
|
|
@ -0,0 +1,302 @@
|
|||
/*
|
||||
* GF-Complete: A Comprehensive Open Source Library for Galois Field Arithmetic
|
||||
* James S. Plank, Ethan L. Miller, Kevin M. Greenan,
|
||||
* Benjamin A. Arnold, John A. Burnum, Adam W. Disney, Allen C. McBride.
|
||||
*
|
||||
* Copyright (c) 2014: Janne Grunau <j@jannau.net>
|
||||
*
|
||||
* Redistribution and use in source and binary forms, with or without
|
||||
* modification, are permitted provided that the following conditions
|
||||
* are met:
|
||||
*
|
||||
* - Redistributions of source code must retain the above copyright
|
||||
* notice, this list of conditions and the following disclaimer.
|
||||
*
|
||||
* - Redistributions in binary form must reproduce the above copyright
|
||||
* notice, this list of conditions and the following disclaimer in
|
||||
* the documentation and/or other materials provided with the
|
||||
* distribution.
|
||||
*
|
||||
* - Neither the name of the University of Tennessee nor the names of its
|
||||
* contributors may be used to endorse or promote products derived
|
||||
* from this software without specific prior written permission.
|
||||
*
|
||||
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
||||
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
||||
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
||||
* A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
|
||||
* HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
|
||||
* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
|
||||
* BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS
|
||||
* OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
|
||||
* AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
|
||||
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY
|
||||
* WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
||||
* POSSIBILITY OF SUCH DAMAGE.
|
||||
*
|
||||
* gf_w8_neon.c
|
||||
*
|
||||
* Neon optimized routines for 8-bit Galois fields
|
||||
*
|
||||
*/
|
||||
|
||||
#include "gf_int.h"
|
||||
#include "gf_w8.h"
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
|
||||
/* ARM NEON reducing macro for the carry free multiplication
|
||||
* vmull_p8 is the carryless multiply operation. Here vshrn_n_u16 shifts
|
||||
* the result to the right by 1 byte. This allows us to multiply
|
||||
* the prim_poly by the leading bits of the result. We then xor the result
|
||||
* of that operation back with the result. */
|
||||
#define NEON_CFM_REDUCE(v, w, result, prim_poly, initial) \
|
||||
do { \
|
||||
if (initial) \
|
||||
v = vshrn_n_u16 (vreinterpretq_u16_p16(result), 8); \
|
||||
else \
|
||||
v = veor_u8 (v, vshrn_n_u16 (vreinterpretq_u16_p16(result), 8)); \
|
||||
w = vmull_p8 (prim_poly, vreinterpret_p8_u8(v)); \
|
||||
result = vreinterpretq_p16_u16 (veorq_u16 (vreinterpretq_u16_p16(result), vreinterpretq_u16_p16(w))); \
|
||||
} while (0)
|
||||
|
||||
static
|
||||
inline
|
||||
gf_val_32_t
|
||||
gf_w8_neon_clm_multiply_x (gf_t *gf, gf_val_32_t a8, gf_val_32_t b8, int x)
|
||||
{
|
||||
gf_val_32_t rv = 0;
|
||||
poly8x8_t a, b;
|
||||
uint8x8_t v;
|
||||
poly16x8_t result;
|
||||
poly8x8_t prim_poly;
|
||||
poly16x8_t w;
|
||||
gf_internal_t * h = gf->scratch;
|
||||
|
||||
a = vdup_n_p8 (a8);
|
||||
b = vdup_n_p8 (b8);
|
||||
|
||||
prim_poly = vdup_n_p8 ((uint32_t)(h->prim_poly & 0x1ffULL));
|
||||
|
||||
/* Do the initial multiply */
|
||||
result = vmull_p8 (a, b);
|
||||
|
||||
/* Ben: Do prim_poly reduction twice. We are guaranteed that we will only
|
||||
have to do the reduction at most twice, because (w-2)/z == 2. Where
|
||||
z is equal to the number of zeros after the leading 1 */
|
||||
NEON_CFM_REDUCE (v, w, result, prim_poly, 1);
|
||||
NEON_CFM_REDUCE (v, w, result, prim_poly, 0);
|
||||
if (x >= 3) {
|
||||
NEON_CFM_REDUCE (v, w, result, prim_poly, 0);
|
||||
}
|
||||
if (x >= 4) {
|
||||
NEON_CFM_REDUCE (v, w, result, prim_poly, 0);
|
||||
}
|
||||
/* Extracts 32 bit value from result. */
|
||||
rv = (gf_val_32_t)vget_lane_u8 (vmovn_u16 (vreinterpretq_u16_p16 (result)), 0);
|
||||
|
||||
return rv;
|
||||
}
|
||||
|
||||
#define CLM_MULTIPLY(x) \
|
||||
static gf_val_32_t gf_w8_neon_clm_multiply_ ## x (gf_t *gf, gf_val_32_t a8, gf_val_32_t b8) \
|
||||
{\
|
||||
return gf_w8_neon_clm_multiply_x (gf, a8, b8, x);\
|
||||
}
|
||||
|
||||
CLM_MULTIPLY(2)
|
||||
CLM_MULTIPLY(3)
|
||||
CLM_MULTIPLY(4)
|
||||
|
||||
static inline void
|
||||
neon_clm_multiply_region_from_single_x(gf_t *gf, uint8_t *s8, uint8_t *d8,
|
||||
gf_val_32_t val, uint8_t *d_end,
|
||||
int xor, int x)
|
||||
{
|
||||
gf_internal_t * h = gf->scratch;
|
||||
poly8x8_t a, b;
|
||||
uint8x8_t c, v;
|
||||
poly16x8_t result;
|
||||
poly8x8_t prim_poly;
|
||||
poly16x8_t w;
|
||||
|
||||
a = vdup_n_p8 (val);
|
||||
prim_poly = vdup_n_p8 ((uint8_t)(h->prim_poly & 0xffULL));
|
||||
|
||||
while (d8 < d_end) {
|
||||
b = vld1_p8 ((poly8_t *) s8);
|
||||
|
||||
if (xor)
|
||||
c = vld1_u8 (d8);
|
||||
|
||||
result = vmull_p8 (a, b);
|
||||
|
||||
NEON_CFM_REDUCE(v, w, result, prim_poly, 1);
|
||||
NEON_CFM_REDUCE (v, w, result, prim_poly, 0);
|
||||
if (x >= 3) {
|
||||
NEON_CFM_REDUCE (v, w, result, prim_poly, 0);
|
||||
}
|
||||
if (x >= 4) {
|
||||
NEON_CFM_REDUCE (v, w, result, prim_poly, 0);
|
||||
}
|
||||
v = vmovn_u16 (vreinterpretq_u16_p16 (result));
|
||||
if (xor)
|
||||
v = veor_u8 (c, v);
|
||||
|
||||
vst1_u8 (d8, v);
|
||||
|
||||
d8 += 8;
|
||||
s8 += 8;
|
||||
}
|
||||
}
|
||||
|
||||
#define CLM_MULT_REGION(x) \
|
||||
static void \
|
||||
gf_w8_neon_clm_multiply_region_from_single_ ## x (gf_t *gf, void *src, \
|
||||
void *dest, \
|
||||
gf_val_32_t val, int bytes, \
|
||||
int xor) \
|
||||
{ \
|
||||
gf_region_data rd; \
|
||||
uint8_t *s8; \
|
||||
uint8_t *d8; \
|
||||
\
|
||||
if (val == 0) { gf_multby_zero(dest, bytes, xor); return; } \
|
||||
if (val == 1) { gf_multby_one(src, dest, bytes, xor); return; } \
|
||||
\
|
||||
gf_set_region_data(&rd, gf, src, dest, bytes, val, xor, 16); \
|
||||
gf_do_initial_region_alignment(&rd); \
|
||||
s8 = (uint8_t *) rd.s_start; \
|
||||
d8 = (uint8_t *) rd.d_start; \
|
||||
\
|
||||
if (xor) \
|
||||
neon_clm_multiply_region_from_single_x (gf, s8, d8, val, rd.d_top, 1, x); \
|
||||
else \
|
||||
neon_clm_multiply_region_from_single_x (gf, s8, d8, val, rd.d_top, 0, x);\
|
||||
gf_do_final_region_alignment(&rd); \
|
||||
}
|
||||
|
||||
CLM_MULT_REGION(2)
|
||||
CLM_MULT_REGION(3)
|
||||
CLM_MULT_REGION(4)
|
||||
|
||||
|
||||
int gf_w8_neon_cfm_init(gf_t *gf)
|
||||
{
|
||||
gf_internal_t *h;
|
||||
|
||||
h = (gf_internal_t *) gf->scratch;
|
||||
|
||||
if ((0xe0 & h->prim_poly) == 0){
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w8_neon_clm_multiply_2)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w8_neon_clm_multiply_region_from_single_2)
|
||||
}else if ((0xc0 & h->prim_poly) == 0){
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w8_neon_clm_multiply_3)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w8_neon_clm_multiply_region_from_single_3)
|
||||
}else if ((0x80 & h->prim_poly) == 0){
|
||||
SET_FUNCTION(gf,multiply,w32,gf_w8_neon_clm_multiply_4)
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w8_neon_clm_multiply_region_from_single_4)
|
||||
}else{
|
||||
return 0;
|
||||
}
|
||||
return 1;
|
||||
}
|
||||
|
||||
#ifndef ARCH_AARCH64
|
||||
#define vqtbl1q_u8(tbl, v) vcombine_u8(vtbl2_u8(tbl, vget_low_u8(v)), \
|
||||
vtbl2_u8(tbl, vget_high_u8(v)))
|
||||
#endif
|
||||
|
||||
static
|
||||
void
|
||||
gf_w8_split_multiply_region_neon(gf_t *gf, void *src, void *dest, gf_val_32_t val, int bytes, int xor)
|
||||
{
|
||||
uint8_t *bh, *bl, *sptr, *dptr;
|
||||
uint8x16_t r, va, vh, vl, loset;
|
||||
#ifdef ARCH_AARCH64
|
||||
uint8x16_t mth, mtl;
|
||||
#else
|
||||
uint8x8x2_t mth, mtl;
|
||||
#endif
|
||||
struct gf_w8_half_table_data *htd;
|
||||
gf_region_data rd;
|
||||
|
||||
if (val == 0) { gf_multby_zero(dest, bytes, xor); return; }
|
||||
if (val == 1) { gf_multby_one(src, dest, bytes, xor); return; }
|
||||
|
||||
htd = (struct gf_w8_half_table_data *) ((gf_internal_t *) (gf->scratch))->private;
|
||||
|
||||
gf_set_region_data(&rd, gf, src, dest, bytes, val, xor, 16);
|
||||
gf_do_initial_region_alignment(&rd);
|
||||
|
||||
bh = (uint8_t *) htd->high;
|
||||
bh += (val << 4);
|
||||
bl = (uint8_t *) htd->low;
|
||||
bl += (val << 4);
|
||||
|
||||
sptr = rd.s_start;
|
||||
dptr = rd.d_start;
|
||||
|
||||
#ifdef ARCH_AARCH64
|
||||
mth = vld1q_u8 (bh);
|
||||
mtl = vld1q_u8 (bl);
|
||||
#else
|
||||
mth.val[0] = vld1_u8 (bh);
|
||||
mtl.val[0] = vld1_u8 (bl);
|
||||
mth.val[1] = vld1_u8 (bh + 8);
|
||||
mtl.val[1] = vld1_u8 (bl + 8);
|
||||
#endif
|
||||
|
||||
loset = vdupq_n_u8(0xf);
|
||||
|
||||
if (xor) {
|
||||
while (sptr < (uint8_t *) rd.s_top) {
|
||||
va = vld1q_u8 (sptr);
|
||||
|
||||
vh = vshrq_n_u8 (va, 4);
|
||||
vl = vandq_u8 (va, loset);
|
||||
va = vld1q_u8 (dptr);
|
||||
|
||||
vh = vqtbl1q_u8 (mth, vh);
|
||||
vl = vqtbl1q_u8 (mtl, vl);
|
||||
|
||||
r = veorq_u8 (vh, vl);
|
||||
|
||||
vst1q_u8 (dptr, veorq_u8 (va, r));
|
||||
|
||||
dptr += 16;
|
||||
sptr += 16;
|
||||
}
|
||||
} else {
|
||||
while (sptr < (uint8_t *) rd.s_top) {
|
||||
va = vld1q_u8 (sptr);
|
||||
|
||||
vh = vshrq_n_u8 (va, 4);
|
||||
vl = vandq_u8 (va, loset);
|
||||
#ifdef ARCH_AARCH64
|
||||
vh = vqtbl1q_u8 (mth, vh);
|
||||
vl = vqtbl1q_u8 (mtl, vl);
|
||||
#else
|
||||
vh = vcombine_u8 (vtbl2_u8 (mth, vget_low_u8 (vh)),
|
||||
vtbl2_u8 (mth, vget_high_u8 (vh)));
|
||||
vl = vcombine_u8 (vtbl2_u8 (mtl, vget_low_u8 (vl)),
|
||||
vtbl2_u8 (mtl, vget_high_u8 (vl)));
|
||||
#endif
|
||||
|
||||
r = veorq_u8 (vh, vl);
|
||||
|
||||
vst1q_u8(dptr, r);
|
||||
|
||||
dptr += 16;
|
||||
sptr += 16;
|
||||
}
|
||||
}
|
||||
|
||||
gf_do_final_region_alignment(&rd);
|
||||
}
|
||||
|
||||
|
||||
void gf_w8_neon_split_init(gf_t *gf)
|
||||
{
|
||||
SET_FUNCTION(gf,multiply_region,w32,gf_w8_split_multiply_region_neon)
|
||||
}
|
139
test-driver
|
@ -1,139 +0,0 @@
|
|||
#! /bin/sh
|
||||
# test-driver - basic testsuite driver script.
|
||||
|
||||
scriptversion=2013-07-13.22; # UTC
|
||||
|
||||
# Copyright (C) 2011-2013 Free Software Foundation, Inc.
|
||||
#
|
||||
# This program is free software; you can redistribute it and/or modify
|
||||
# it under the terms of the GNU General Public License as published by
|
||||
# the Free Software Foundation; either version 2, or (at your option)
|
||||
# any later version.
|
||||
#
|
||||
# This program is distributed in the hope that it will be useful,
|
||||
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||
# GNU General Public License for more details.
|
||||
#
|
||||
# You should have received a copy of the GNU General Public License
|
||||
# along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||
|
||||
# As a special exception to the GNU General Public License, if you
|
||||
# distribute this file as part of a program that contains a
|
||||
# configuration script generated by Autoconf, you may include it under
|
||||
# the same distribution terms that you use for the rest of that program.
|
||||
|
||||
# This file is maintained in Automake, please report
|
||||
# bugs to <bug-automake@gnu.org> or send patches to
|
||||
# <automake-patches@gnu.org>.
|
||||
|
||||
# Make unconditional expansion of undefined variables an error. This
|
||||
# helps a lot in preventing typo-related bugs.
|
||||
set -u
|
||||
|
||||
usage_error ()
|
||||
{
|
||||
echo "$0: $*" >&2
|
||||
print_usage >&2
|
||||
exit 2
|
||||
}
|
||||
|
||||
print_usage ()
|
||||
{
|
||||
cat <<END
|
||||
Usage:
|
||||
test-driver --test-name=NAME --log-file=PATH --trs-file=PATH
|
||||
[--expect-failure={yes|no}] [--color-tests={yes|no}]
|
||||
[--enable-hard-errors={yes|no}] [--]
|
||||
TEST-SCRIPT [TEST-SCRIPT-ARGUMENTS]
|
||||
The '--test-name', '--log-file' and '--trs-file' options are mandatory.
|
||||
END
|
||||
}
|
||||
|
||||
test_name= # Used for reporting.
|
||||
log_file= # Where to save the output of the test script.
|
||||
trs_file= # Where to save the metadata of the test run.
|
||||
expect_failure=no
|
||||
color_tests=no
|
||||
enable_hard_errors=yes
|
||||
while test $# -gt 0; do
|
||||
case $1 in
|
||||
--help) print_usage; exit $?;;
|
||||
--version) echo "test-driver $scriptversion"; exit $?;;
|
||||
--test-name) test_name=$2; shift;;
|
||||
--log-file) log_file=$2; shift;;
|
||||
--trs-file) trs_file=$2; shift;;
|
||||
--color-tests) color_tests=$2; shift;;
|
||||
--expect-failure) expect_failure=$2; shift;;
|
||||
--enable-hard-errors) enable_hard_errors=$2; shift;;
|
||||
--) shift; break;;
|
||||
-*) usage_error "invalid option: '$1'";;
|
||||
*) break;;
|
||||
esac
|
||||
shift
|
||||
done
|
||||
|
||||
missing_opts=
|
||||
test x"$test_name" = x && missing_opts="$missing_opts --test-name"
|
||||
test x"$log_file" = x && missing_opts="$missing_opts --log-file"
|
||||
test x"$trs_file" = x && missing_opts="$missing_opts --trs-file"
|
||||
if test x"$missing_opts" != x; then
|
||||
usage_error "the following mandatory options are missing:$missing_opts"
|
||||
fi
|
||||
|
||||
if test $# -eq 0; then
|
||||
usage_error "missing argument"
|
||||
fi
|
||||
|
||||
if test $color_tests = yes; then
|
||||
# Keep this in sync with 'lib/am/check.am:$(am__tty_colors)'.
|
||||
red='[0;31m' # Red.
|
||||
grn='[0;32m' # Green.
|
||||
lgn='[1;32m' # Light green.
|
||||
blu='[1;34m' # Blue.
|
||||
mgn='[0;35m' # Magenta.
|
||||
std='[m' # No color.
|
||||
else
|
||||
red= grn= lgn= blu= mgn= std=
|
||||
fi
|
||||
|
||||
do_exit='rm -f $log_file $trs_file; (exit $st); exit $st'
|
||||
trap "st=129; $do_exit" 1
|
||||
trap "st=130; $do_exit" 2
|
||||
trap "st=141; $do_exit" 13
|
||||
trap "st=143; $do_exit" 15
|
||||
|
||||
# Test script is run here.
|
||||
"$@" >$log_file 2>&1
|
||||
estatus=$?
|
||||
if test $enable_hard_errors = no && test $estatus -eq 99; then
|
||||
estatus=1
|
||||
fi
|
||||
|
||||
case $estatus:$expect_failure in
|
||||
0:yes) col=$red res=XPASS recheck=yes gcopy=yes;;
|
||||
0:*) col=$grn res=PASS recheck=no gcopy=no;;
|
||||
77:*) col=$blu res=SKIP recheck=no gcopy=yes;;
|
||||
99:*) col=$mgn res=ERROR recheck=yes gcopy=yes;;
|
||||
*:yes) col=$lgn res=XFAIL recheck=no gcopy=yes;;
|
||||
*:*) col=$red res=FAIL recheck=yes gcopy=yes;;
|
||||
esac
|
||||
|
||||
# Report outcome to console.
|
||||
echo "${col}${res}${std}: $test_name"
|
||||
|
||||
# Register the test result, and other relevant metadata.
|
||||
echo ":test-result: $res" > $trs_file
|
||||
echo ":global-test-result: $res" >> $trs_file
|
||||
echo ":recheck: $recheck" >> $trs_file
|
||||
echo ":copy-in-global-log: $gcopy" >> $trs_file
|
||||
|
||||
# Local Variables:
|
||||
# mode: shell-script
|
||||
# sh-indentation: 2
|
||||
# eval: (add-hook 'write-file-hooks 'time-stamp)
|
||||
# time-stamp-start: "scriptversion="
|
||||
# time-stamp-format: "%:y-%02m-%02d.%02H"
|
||||
# time-stamp-time-zone: "UTC"
|
||||
# time-stamp-end: "; # UTC"
|
||||
# End:
|
|
@ -1,7 +1,7 @@
|
|||
# GF-Complete 'test' AM file
|
||||
|
||||
INCLUDES=-I./ -I../include
|
||||
AM_CFLAGS = -O3 $(SIMD_FLAGS) -fPIC $(INCLUDES)
|
||||
AM_CPPFLAGS = -I$(top_builddir)/include -I$(top_srcdir)/include
|
||||
AM_CFLAGS = -O3 -fPIC
|
||||
|
||||
bin_PROGRAMS = gf_unit
|
||||
|
||||
|
|
623
test/Makefile.in
|
@ -1,623 +0,0 @@
|
|||
# Makefile.in generated by automake 1.14.1 from Makefile.am.
|
||||
# @configure_input@
|
||||
|
||||
# Copyright (C) 1994-2013 Free Software Foundation, Inc.
|
||||
|
||||
# This Makefile.in is free software; the Free Software Foundation
|
||||
# gives unlimited permission to copy and/or distribute it,
|
||||
# with or without modifications, as long as this notice is preserved.
|
||||
|
||||
# This program is distributed in the hope that it will be useful,
|
||||
# but WITHOUT ANY WARRANTY, to the extent permitted by law; without
|
||||
# even the implied warranty of MERCHANTABILITY or FITNESS FOR A
|
||||
# PARTICULAR PURPOSE.
|
||||
|
||||
@SET_MAKE@
|
||||
|
||||
# GF-Complete 'test' AM file
|
||||
|
||||
VPATH = @srcdir@
|
||||
am__is_gnu_make = test -n '$(MAKEFILE_LIST)' && test -n '$(MAKELEVEL)'
|
||||
am__make_running_with_option = \
|
||||
case $${target_option-} in \
|
||||
?) ;; \
|
||||
*) echo "am__make_running_with_option: internal error: invalid" \
|
||||
"target option '$${target_option-}' specified" >&2; \
|
||||
exit 1;; \
|
||||
esac; \
|
||||
has_opt=no; \
|
||||
sane_makeflags=$$MAKEFLAGS; \
|
||||
if $(am__is_gnu_make); then \
|
||||
sane_makeflags=$$MFLAGS; \
|
||||
else \
|
||||
case $$MAKEFLAGS in \
|
||||
*\\[\ \ ]*) \
|
||||
bs=\\; \
|
||||
sane_makeflags=`printf '%s\n' "$$MAKEFLAGS" \
|
||||
| sed "s/$$bs$$bs[$$bs $$bs ]*//g"`;; \
|
||||
esac; \
|
||||
fi; \
|
||||
skip_next=no; \
|
||||
strip_trailopt () \
|
||||
{ \
|
||||
flg=`printf '%s\n' "$$flg" | sed "s/$$1.*$$//"`; \
|
||||
}; \
|
||||
for flg in $$sane_makeflags; do \
|
||||
test $$skip_next = yes && { skip_next=no; continue; }; \
|
||||
case $$flg in \
|
||||
*=*|--*) continue;; \
|
||||
-*I) strip_trailopt 'I'; skip_next=yes;; \
|
||||
-*I?*) strip_trailopt 'I';; \
|
||||
-*O) strip_trailopt 'O'; skip_next=yes;; \
|
||||
-*O?*) strip_trailopt 'O';; \
|
||||
-*l) strip_trailopt 'l'; skip_next=yes;; \
|
||||
-*l?*) strip_trailopt 'l';; \
|
||||
-[dEDm]) skip_next=yes;; \
|
||||
-[JT]) skip_next=yes;; \
|
||||
esac; \
|
||||
case $$flg in \
|
||||
*$$target_option*) has_opt=yes; break;; \
|
||||
esac; \
|
||||
done; \
|
||||
test $$has_opt = yes
|
||||
am__make_dryrun = (target_option=n; $(am__make_running_with_option))
|
||||
am__make_keepgoing = (target_option=k; $(am__make_running_with_option))
|
||||
pkgdatadir = $(datadir)/@PACKAGE@
|
||||
pkgincludedir = $(includedir)/@PACKAGE@
|
||||
pkglibdir = $(libdir)/@PACKAGE@
|
||||
pkglibexecdir = $(libexecdir)/@PACKAGE@
|
||||
am__cd = CDPATH="$${ZSH_VERSION+.}$(PATH_SEPARATOR)" && cd
|
||||
install_sh_DATA = $(install_sh) -c -m 644
|
||||
install_sh_PROGRAM = $(install_sh) -c
|
||||
install_sh_SCRIPT = $(install_sh) -c
|
||||
INSTALL_HEADER = $(INSTALL_DATA)
|
||||
transform = $(program_transform_name)
|
||||
NORMAL_INSTALL = :
|
||||
PRE_INSTALL = :
|
||||
POST_INSTALL = :
|
||||
NORMAL_UNINSTALL = :
|
||||
PRE_UNINSTALL = :
|
||||
POST_UNINSTALL = :
|
||||
build_triplet = @build@
|
||||
host_triplet = @host@
|
||||
bin_PROGRAMS = gf_unit$(EXEEXT)
|
||||
subdir = test
|
||||
DIST_COMMON = $(srcdir)/Makefile.in $(srcdir)/Makefile.am \
|
||||
$(top_srcdir)/depcomp
|
||||
ACLOCAL_M4 = $(top_srcdir)/aclocal.m4
|
||||
am__aclocal_m4_deps = $(top_srcdir)/m4/ax_check_compile_flag.m4 \
|
||||
$(top_srcdir)/m4/ax_ext.m4 \
|
||||
$(top_srcdir)/m4/ax_gcc_x86_avx_xgetbv.m4 \
|
||||
$(top_srcdir)/m4/ax_gcc_x86_cpuid.m4 \
|
||||
$(top_srcdir)/m4/libtool.m4 $(top_srcdir)/m4/ltoptions.m4 \
|
||||
$(top_srcdir)/m4/ltsugar.m4 $(top_srcdir)/m4/ltversion.m4 \
|
||||
$(top_srcdir)/m4/lt~obsolete.m4 $(top_srcdir)/configure.ac
|
||||
am__configure_deps = $(am__aclocal_m4_deps) $(CONFIGURE_DEPENDENCIES) \
|
||||
$(ACLOCAL_M4)
|
||||
mkinstalldirs = $(install_sh) -d
|
||||
CONFIG_HEADER = $(top_builddir)/include/config.h
|
||||
CONFIG_CLEAN_FILES =
|
||||
CONFIG_CLEAN_VPATH_FILES =
|
||||
am__installdirs = "$(DESTDIR)$(bindir)"
|
||||
PROGRAMS = $(bin_PROGRAMS)
|
||||
am_gf_unit_OBJECTS = gf_unit.$(OBJEXT)
|
||||
gf_unit_OBJECTS = $(am_gf_unit_OBJECTS)
|
||||
gf_unit_DEPENDENCIES = ../src/libgf_complete.la
|
||||
AM_V_lt = $(am__v_lt_@AM_V@)
|
||||
am__v_lt_ = $(am__v_lt_@AM_DEFAULT_V@)
|
||||
am__v_lt_0 = --silent
|
||||
am__v_lt_1 =
|
||||
AM_V_P = $(am__v_P_@AM_V@)
|
||||
am__v_P_ = $(am__v_P_@AM_DEFAULT_V@)
|
||||
am__v_P_0 = false
|
||||
am__v_P_1 = :
|
||||
AM_V_GEN = $(am__v_GEN_@AM_V@)
|
||||
am__v_GEN_ = $(am__v_GEN_@AM_DEFAULT_V@)
|
||||
am__v_GEN_0 = @echo " GEN " $@;
|
||||
am__v_GEN_1 =
|
||||
AM_V_at = $(am__v_at_@AM_V@)
|
||||
am__v_at_ = $(am__v_at_@AM_DEFAULT_V@)
|
||||
am__v_at_0 = @
|
||||
am__v_at_1 =
|
||||
DEFAULT_INCLUDES = -I.@am__isrc@ -I$(top_builddir)/include
|
||||
depcomp = $(SHELL) $(top_srcdir)/depcomp
|
||||
am__depfiles_maybe = depfiles
|
||||
am__mv = mv -f
|
||||
COMPILE = $(CC) $(DEFS) $(DEFAULT_INCLUDES) $(INCLUDES) $(AM_CPPFLAGS) \
|
||||
$(CPPFLAGS) $(AM_CFLAGS) $(CFLAGS)
|
||||
LTCOMPILE = $(LIBTOOL) $(AM_V_lt) --tag=CC $(AM_LIBTOOLFLAGS) \
|
||||
$(LIBTOOLFLAGS) --mode=compile $(CC) $(DEFS) \
|
||||
$(DEFAULT_INCLUDES) $(INCLUDES) $(AM_CPPFLAGS) $(CPPFLAGS) \
|
||||
$(AM_CFLAGS) $(CFLAGS)
|
||||
AM_V_CC = $(am__v_CC_@AM_V@)
|
||||
am__v_CC_ = $(am__v_CC_@AM_DEFAULT_V@)
|
||||
am__v_CC_0 = @echo " CC " $@;
|
||||
am__v_CC_1 =
|
||||
CCLD = $(CC)
|
||||
LINK = $(LIBTOOL) $(AM_V_lt) --tag=CC $(AM_LIBTOOLFLAGS) \
|
||||
$(LIBTOOLFLAGS) --mode=link $(CCLD) $(AM_CFLAGS) $(CFLAGS) \
|
||||
$(AM_LDFLAGS) $(LDFLAGS) -o $@
|
||||
AM_V_CCLD = $(am__v_CCLD_@AM_V@)
|
||||
am__v_CCLD_ = $(am__v_CCLD_@AM_DEFAULT_V@)
|
||||
am__v_CCLD_0 = @echo " CCLD " $@;
|
||||
am__v_CCLD_1 =
|
||||
SOURCES = $(gf_unit_SOURCES)
|
||||
DIST_SOURCES = $(gf_unit_SOURCES)
|
||||
am__can_run_installinfo = \
|
||||
case $$AM_UPDATE_INFO_DIR in \
|
||||
n|no|NO) false;; \
|
||||
*) (install-info --version) >/dev/null 2>&1;; \
|
||||
esac
|
||||
am__tagged_files = $(HEADERS) $(SOURCES) $(TAGS_FILES) $(LISP)
|
||||
# Read a list of newline-separated strings from the standard input,
|
||||
# and print each of them once, without duplicates. Input order is
|
||||
# *not* preserved.
|
||||
am__uniquify_input = $(AWK) '\
|
||||
BEGIN { nonempty = 0; } \
|
||||
{ items[$$0] = 1; nonempty = 1; } \
|
||||
END { if (nonempty) { for (i in items) print i; }; } \
|
||||
'
|
||||
# Make sure the list of sources is unique. This is necessary because,
|
||||
# e.g., the same source file might be shared among _SOURCES variables
|
||||
# for different programs/libraries.
|
||||
am__define_uniq_tagged_files = \
|
||||
list='$(am__tagged_files)'; \
|
||||
unique=`for i in $$list; do \
|
||||
if test -f "$$i"; then echo $$i; else echo $(srcdir)/$$i; fi; \
|
||||
done | $(am__uniquify_input)`
|
||||
ETAGS = etags
|
||||
CTAGS = ctags
|
||||
DISTFILES = $(DIST_COMMON) $(DIST_SOURCES) $(TEXINFOS) $(EXTRA_DIST)
|
||||
ACLOCAL = @ACLOCAL@
|
||||
AMTAR = @AMTAR@
|
||||
AM_DEFAULT_VERBOSITY = @AM_DEFAULT_VERBOSITY@
|
||||
AR = @AR@
|
||||
AUTOCONF = @AUTOCONF@
|
||||
AUTOHEADER = @AUTOHEADER@
|
||||
AUTOMAKE = @AUTOMAKE@
|
||||
AWK = @AWK@
|
||||
CC = @CC@
|
||||
CCDEPMODE = @CCDEPMODE@
|
||||
CFLAGS = @CFLAGS@
|
||||
CPP = @CPP@
|
||||
CPPFLAGS = @CPPFLAGS@
|
||||
CYGPATH_W = @CYGPATH_W@
|
||||
DEFS = @DEFS@
|
||||
DEPDIR = @DEPDIR@
|
||||
DLLTOOL = @DLLTOOL@
|
||||
DSYMUTIL = @DSYMUTIL@
|
||||
DUMPBIN = @DUMPBIN@
|
||||
ECHO_C = @ECHO_C@
|
||||
ECHO_N = @ECHO_N@
|
||||
ECHO_T = @ECHO_T@
|
||||
EGREP = @EGREP@
|
||||
EXEEXT = @EXEEXT@
|
||||
FGREP = @FGREP@
|
||||
GREP = @GREP@
|
||||
INSTALL = @INSTALL@
|
||||
INSTALL_DATA = @INSTALL_DATA@
|
||||
INSTALL_PROGRAM = @INSTALL_PROGRAM@
|
||||
INSTALL_SCRIPT = @INSTALL_SCRIPT@
|
||||
INSTALL_STRIP_PROGRAM = @INSTALL_STRIP_PROGRAM@
|
||||
LD = @LD@
|
||||
LDFLAGS = @LDFLAGS@
|
||||
LIBOBJS = @LIBOBJS@
|
||||
LIBS = @LIBS@
|
||||
LIBTOOL = @LIBTOOL@
|
||||
LIPO = @LIPO@
|
||||
LN_S = @LN_S@
|
||||
LTLIBOBJS = @LTLIBOBJS@
|
||||
MAINT = @MAINT@
|
||||
MAKEINFO = @MAKEINFO@
|
||||
MANIFEST_TOOL = @MANIFEST_TOOL@
|
||||
MKDIR_P = @MKDIR_P@
|
||||
NM = @NM@
|
||||
NMEDIT = @NMEDIT@
|
||||
OBJDUMP = @OBJDUMP@
|
||||
OBJEXT = @OBJEXT@
|
||||
OTOOL = @OTOOL@
|
||||
OTOOL64 = @OTOOL64@
|
||||
PACKAGE = @PACKAGE@
|
||||
PACKAGE_BUGREPORT = @PACKAGE_BUGREPORT@
|
||||
PACKAGE_NAME = @PACKAGE_NAME@
|
||||
PACKAGE_STRING = @PACKAGE_STRING@
|
||||
PACKAGE_TARNAME = @PACKAGE_TARNAME@
|
||||
PACKAGE_URL = @PACKAGE_URL@
|
||||
PACKAGE_VERSION = @PACKAGE_VERSION@
|
||||
PATH_SEPARATOR = @PATH_SEPARATOR@
|
||||
RANLIB = @RANLIB@
|
||||
SED = @SED@
|
||||
SET_MAKE = @SET_MAKE@
|
||||
SHELL = @SHELL@
|
||||
SIMD_FLAGS = @SIMD_FLAGS@
|
||||
STRIP = @STRIP@
|
||||
VERSION = @VERSION@
|
||||
abs_builddir = @abs_builddir@
|
||||
abs_srcdir = @abs_srcdir@
|
||||
abs_top_builddir = @abs_top_builddir@
|
||||
abs_top_srcdir = @abs_top_srcdir@
|
||||
ac_ct_AR = @ac_ct_AR@
|
||||
ac_ct_CC = @ac_ct_CC@
|
||||
ac_ct_DUMPBIN = @ac_ct_DUMPBIN@
|
||||
am__include = @am__include@
|
||||
am__leading_dot = @am__leading_dot@
|
||||
am__quote = @am__quote@
|
||||
am__tar = @am__tar@
|
||||
am__untar = @am__untar@
|
||||
bindir = @bindir@
|
||||
build = @build@
|
||||
build_alias = @build_alias@
|
||||
build_cpu = @build_cpu@
|
||||
build_os = @build_os@
|
||||
build_vendor = @build_vendor@
|
||||
builddir = @builddir@
|
||||
datadir = @datadir@
|
||||
datarootdir = @datarootdir@
|
||||
docdir = @docdir@
|
||||
dvidir = @dvidir@
|
||||
exec_prefix = @exec_prefix@
|
||||
host = @host@
|
||||
host_alias = @host_alias@
|
||||
host_cpu = @host_cpu@
|
||||
host_os = @host_os@
|
||||
host_vendor = @host_vendor@
|
||||
htmldir = @htmldir@
|
||||
includedir = @includedir@
|
||||
infodir = @infodir@
|
||||
install_sh = @install_sh@
|
||||
libdir = @libdir@
|
||||
libexecdir = @libexecdir@
|
||||
localedir = @localedir@
|
||||
localstatedir = @localstatedir@
|
||||
mandir = @mandir@
|
||||
mkdir_p = @mkdir_p@
|
||||
oldincludedir = @oldincludedir@
|
||||
pdfdir = @pdfdir@
|
||||
prefix = @prefix@
|
||||
program_transform_name = @program_transform_name@
|
||||
psdir = @psdir@
|
||||
sbindir = @sbindir@
|
||||
sharedstatedir = @sharedstatedir@
|
||||
srcdir = @srcdir@
|
||||
sysconfdir = @sysconfdir@
|
||||
target_alias = @target_alias@
|
||||
top_build_prefix = @top_build_prefix@
|
||||
top_builddir = @top_builddir@
|
||||
top_srcdir = @top_srcdir@
|
||||
INCLUDES = -I./ -I../include
|
||||
AM_CFLAGS = -O3 $(SIMD_FLAGS) -fPIC $(INCLUDES)
|
||||
gf_unit_SOURCES = gf_unit.c
|
||||
#gf_unit_LDFLAGS = -lgf_complete
|
||||
gf_unit_LDADD = ../src/libgf_complete.la
|
||||
all: all-am
|
||||
|
||||
.SUFFIXES:
|
||||
.SUFFIXES: .c .lo .o .obj
|
||||
$(srcdir)/Makefile.in: @MAINTAINER_MODE_TRUE@ $(srcdir)/Makefile.am $(am__configure_deps)
|
||||
@for dep in $?; do \
|
||||
case '$(am__configure_deps)' in \
|
||||
*$$dep*) \
|
||||
( cd $(top_builddir) && $(MAKE) $(AM_MAKEFLAGS) am--refresh ) \
|
||||
&& { if test -f $@; then exit 0; else break; fi; }; \
|
||||
exit 1;; \
|
||||
esac; \
|
||||
done; \
|
||||
echo ' cd $(top_srcdir) && $(AUTOMAKE) --gnu test/Makefile'; \
|
||||
$(am__cd) $(top_srcdir) && \
|
||||
$(AUTOMAKE) --gnu test/Makefile
|
||||
.PRECIOUS: Makefile
|
||||
Makefile: $(srcdir)/Makefile.in $(top_builddir)/config.status
|
||||
@case '$?' in \
|
||||
*config.status*) \
|
||||
cd $(top_builddir) && $(MAKE) $(AM_MAKEFLAGS) am--refresh;; \
|
||||
*) \
|
||||
echo ' cd $(top_builddir) && $(SHELL) ./config.status $(subdir)/$@ $(am__depfiles_maybe)'; \
|
||||
cd $(top_builddir) && $(SHELL) ./config.status $(subdir)/$@ $(am__depfiles_maybe);; \
|
||||
esac;
|
||||
|
||||
$(top_builddir)/config.status: $(top_srcdir)/configure $(CONFIG_STATUS_DEPENDENCIES)
|
||||
cd $(top_builddir) && $(MAKE) $(AM_MAKEFLAGS) am--refresh
|
||||
|
||||
$(top_srcdir)/configure: @MAINTAINER_MODE_TRUE@ $(am__configure_deps)
|
||||
cd $(top_builddir) && $(MAKE) $(AM_MAKEFLAGS) am--refresh
|
||||
$(ACLOCAL_M4): @MAINTAINER_MODE_TRUE@ $(am__aclocal_m4_deps)
|
||||
cd $(top_builddir) && $(MAKE) $(AM_MAKEFLAGS) am--refresh
|
||||
$(am__aclocal_m4_deps):
|
||||
install-binPROGRAMS: $(bin_PROGRAMS)
|
||||
@$(NORMAL_INSTALL)
|
||||
@list='$(bin_PROGRAMS)'; test -n "$(bindir)" || list=; \
|
||||
if test -n "$$list"; then \
|
||||
echo " $(MKDIR_P) '$(DESTDIR)$(bindir)'"; \
|
||||
$(MKDIR_P) "$(DESTDIR)$(bindir)" || exit 1; \
|
||||
fi; \
|
||||
for p in $$list; do echo "$$p $$p"; done | \
|
||||
sed 's/$(EXEEXT)$$//' | \
|
||||
while read p p1; do if test -f $$p \
|
||||
|| test -f $$p1 \
|
||||
; then echo "$$p"; echo "$$p"; else :; fi; \
|
||||
done | \
|
||||
sed -e 'p;s,.*/,,;n;h' \
|
||||
-e 's|.*|.|' \
|
||||
-e 'p;x;s,.*/,,;s/$(EXEEXT)$$//;$(transform);s/$$/$(EXEEXT)/' | \
|
||||
sed 'N;N;N;s,\n, ,g' | \
|
||||
$(AWK) 'BEGIN { files["."] = ""; dirs["."] = 1 } \
|
||||
{ d=$$3; if (dirs[d] != 1) { print "d", d; dirs[d] = 1 } \
|
||||
if ($$2 == $$4) files[d] = files[d] " " $$1; \
|
||||
else { print "f", $$3 "/" $$4, $$1; } } \
|
||||
END { for (d in files) print "f", d, files[d] }' | \
|
||||
while read type dir files; do \
|
||||
if test "$$dir" = .; then dir=; else dir=/$$dir; fi; \
|
||||
test -z "$$files" || { \
|
||||
echo " $(INSTALL_PROGRAM_ENV) $(LIBTOOL) $(AM_LIBTOOLFLAGS) $(LIBTOOLFLAGS) --mode=install $(INSTALL_PROGRAM) $$files '$(DESTDIR)$(bindir)$$dir'"; \
|
||||
$(INSTALL_PROGRAM_ENV) $(LIBTOOL) $(AM_LIBTOOLFLAGS) $(LIBTOOLFLAGS) --mode=install $(INSTALL_PROGRAM) $$files "$(DESTDIR)$(bindir)$$dir" || exit $$?; \
|
||||
} \
|
||||
; done
|
||||
|
||||
uninstall-binPROGRAMS:
|
||||
@$(NORMAL_UNINSTALL)
|
||||
@list='$(bin_PROGRAMS)'; test -n "$(bindir)" || list=; \
|
||||
files=`for p in $$list; do echo "$$p"; done | \
|
||||
sed -e 'h;s,^.*/,,;s/$(EXEEXT)$$//;$(transform)' \
|
||||
-e 's/$$/$(EXEEXT)/' \
|
||||
`; \
|
||||
test -n "$$list" || exit 0; \
|
||||
echo " ( cd '$(DESTDIR)$(bindir)' && rm -f" $$files ")"; \
|
||||
cd "$(DESTDIR)$(bindir)" && rm -f $$files
|
||||
|
||||
clean-binPROGRAMS:
|
||||
@list='$(bin_PROGRAMS)'; test -n "$$list" || exit 0; \
|
||||
echo " rm -f" $$list; \
|
||||
rm -f $$list || exit $$?; \
|
||||
test -n "$(EXEEXT)" || exit 0; \
|
||||
list=`for p in $$list; do echo "$$p"; done | sed 's/$(EXEEXT)$$//'`; \
|
||||
echo " rm -f" $$list; \
|
||||
rm -f $$list
|
||||
|
||||
gf_unit$(EXEEXT): $(gf_unit_OBJECTS) $(gf_unit_DEPENDENCIES) $(EXTRA_gf_unit_DEPENDENCIES)
|
||||
@rm -f gf_unit$(EXEEXT)
|
||||
$(AM_V_CCLD)$(LINK) $(gf_unit_OBJECTS) $(gf_unit_LDADD) $(LIBS)
|
||||
|
||||
mostlyclean-compile:
|
||||
-rm -f *.$(OBJEXT)
|
||||
|
||||
distclean-compile:
|
||||
-rm -f *.tab.c
|
||||
|
||||
@AMDEP_TRUE@@am__include@ @am__quote@./$(DEPDIR)/gf_unit.Po@am__quote@
|
||||
|
||||
.c.o:
|
||||
@am__fastdepCC_TRUE@ $(AM_V_CC)$(COMPILE) -MT $@ -MD -MP -MF $(DEPDIR)/$*.Tpo -c -o $@ $<
|
||||
@am__fastdepCC_TRUE@ $(AM_V_at)$(am__mv) $(DEPDIR)/$*.Tpo $(DEPDIR)/$*.Po
|
||||
@AMDEP_TRUE@@am__fastdepCC_FALSE@ $(AM_V_CC)source='$<' object='$@' libtool=no @AMDEPBACKSLASH@
|
||||
@AMDEP_TRUE@@am__fastdepCC_FALSE@ DEPDIR=$(DEPDIR) $(CCDEPMODE) $(depcomp) @AMDEPBACKSLASH@
|
||||
@am__fastdepCC_FALSE@ $(AM_V_CC@am__nodep@)$(COMPILE) -c -o $@ $<
|
||||
|
||||
.c.obj:
|
||||
@am__fastdepCC_TRUE@ $(AM_V_CC)$(COMPILE) -MT $@ -MD -MP -MF $(DEPDIR)/$*.Tpo -c -o $@ `$(CYGPATH_W) '$<'`
|
||||
@am__fastdepCC_TRUE@ $(AM_V_at)$(am__mv) $(DEPDIR)/$*.Tpo $(DEPDIR)/$*.Po
|
||||
@AMDEP_TRUE@@am__fastdepCC_FALSE@ $(AM_V_CC)source='$<' object='$@' libtool=no @AMDEPBACKSLASH@
|
||||
@AMDEP_TRUE@@am__fastdepCC_FALSE@ DEPDIR=$(DEPDIR) $(CCDEPMODE) $(depcomp) @AMDEPBACKSLASH@
|
||||
@am__fastdepCC_FALSE@ $(AM_V_CC@am__nodep@)$(COMPILE) -c -o $@ `$(CYGPATH_W) '$<'`
|
||||
|
||||
.c.lo:
|
||||
@am__fastdepCC_TRUE@ $(AM_V_CC)$(LTCOMPILE) -MT $@ -MD -MP -MF $(DEPDIR)/$*.Tpo -c -o $@ $<
|
||||
@am__fastdepCC_TRUE@ $(AM_V_at)$(am__mv) $(DEPDIR)/$*.Tpo $(DEPDIR)/$*.Plo
|
||||
@AMDEP_TRUE@@am__fastdepCC_FALSE@ $(AM_V_CC)source='$<' object='$@' libtool=yes @AMDEPBACKSLASH@
|
||||
@AMDEP_TRUE@@am__fastdepCC_FALSE@ DEPDIR=$(DEPDIR) $(CCDEPMODE) $(depcomp) @AMDEPBACKSLASH@
|
||||
@am__fastdepCC_FALSE@ $(AM_V_CC@am__nodep@)$(LTCOMPILE) -c -o $@ $<
|
||||
|
||||
mostlyclean-libtool:
|
||||
-rm -f *.lo
|
||||
|
||||
clean-libtool:
|
||||
-rm -rf .libs _libs
|
||||
|
||||
ID: $(am__tagged_files)
|
||||
$(am__define_uniq_tagged_files); mkid -fID $$unique
|
||||
tags: tags-am
|
||||
TAGS: tags
|
||||
|
||||
tags-am: $(TAGS_DEPENDENCIES) $(am__tagged_files)
|
||||
set x; \
|
||||
here=`pwd`; \
|
||||
$(am__define_uniq_tagged_files); \
|
||||
shift; \
|
||||
if test -z "$(ETAGS_ARGS)$$*$$unique"; then :; else \
|
||||
test -n "$$unique" || unique=$$empty_fix; \
|
||||
if test $$# -gt 0; then \
|
||||
$(ETAGS) $(ETAGSFLAGS) $(AM_ETAGSFLAGS) $(ETAGS_ARGS) \
|
||||
"$$@" $$unique; \
|
||||
else \
|
||||
$(ETAGS) $(ETAGSFLAGS) $(AM_ETAGSFLAGS) $(ETAGS_ARGS) \
|
||||
$$unique; \
|
||||
fi; \
|
||||
fi
|
||||
ctags: ctags-am
|
||||
|
||||
CTAGS: ctags
|
||||
ctags-am: $(TAGS_DEPENDENCIES) $(am__tagged_files)
|
||||
$(am__define_uniq_tagged_files); \
|
||||
test -z "$(CTAGS_ARGS)$$unique" \
|
||||
|| $(CTAGS) $(CTAGSFLAGS) $(AM_CTAGSFLAGS) $(CTAGS_ARGS) \
|
||||
$$unique
|
||||
|
||||
GTAGS:
|
||||
here=`$(am__cd) $(top_builddir) && pwd` \
|
||||
&& $(am__cd) $(top_srcdir) \
|
||||
&& gtags -i $(GTAGS_ARGS) "$$here"
|
||||
cscopelist: cscopelist-am
|
||||
|
||||
cscopelist-am: $(am__tagged_files)
|
||||
list='$(am__tagged_files)'; \
|
||||
case "$(srcdir)" in \
|
||||
[\\/]* | ?:[\\/]*) sdir="$(srcdir)" ;; \
|
||||
*) sdir=$(subdir)/$(srcdir) ;; \
|
||||
esac; \
|
||||
for i in $$list; do \
|
||||
if test -f "$$i"; then \
|
||||
echo "$(subdir)/$$i"; \
|
||||
else \
|
||||
echo "$$sdir/$$i"; \
|
||||
fi; \
|
||||
done >> $(top_builddir)/cscope.files
|
||||
|
||||
distclean-tags:
|
||||
-rm -f TAGS ID GTAGS GRTAGS GSYMS GPATH tags
|
||||
|
||||
distdir: $(DISTFILES)
|
||||
@srcdirstrip=`echo "$(srcdir)" | sed 's/[].[^$$\\*]/\\\\&/g'`; \
|
||||
topsrcdirstrip=`echo "$(top_srcdir)" | sed 's/[].[^$$\\*]/\\\\&/g'`; \
|
||||
list='$(DISTFILES)'; \
|
||||
dist_files=`for file in $$list; do echo $$file; done | \
|
||||
sed -e "s|^$$srcdirstrip/||;t" \
|
||||
-e "s|^$$topsrcdirstrip/|$(top_builddir)/|;t"`; \
|
||||
case $$dist_files in \
|
||||
*/*) $(MKDIR_P) `echo "$$dist_files" | \
|
||||
sed '/\//!d;s|^|$(distdir)/|;s,/[^/]*$$,,' | \
|
||||
sort -u` ;; \
|
||||
esac; \
|
||||
for file in $$dist_files; do \
|
||||
if test -f $$file || test -d $$file; then d=.; else d=$(srcdir); fi; \
|
||||
if test -d $$d/$$file; then \
|
||||
dir=`echo "/$$file" | sed -e 's,/[^/]*$$,,'`; \
|
||||
if test -d "$(distdir)/$$file"; then \
|
||||
find "$(distdir)/$$file" -type d ! -perm -700 -exec chmod u+rwx {} \;; \
|
||||
fi; \
|
||||
if test -d $(srcdir)/$$file && test $$d != $(srcdir); then \
|
||||
cp -fpR $(srcdir)/$$file "$(distdir)$$dir" || exit 1; \
|
||||
find "$(distdir)/$$file" -type d ! -perm -700 -exec chmod u+rwx {} \;; \
|
||||
fi; \
|
||||
cp -fpR $$d/$$file "$(distdir)$$dir" || exit 1; \
|
||||
else \
|
||||
test -f "$(distdir)/$$file" \
|
||||
|| cp -p $$d/$$file "$(distdir)/$$file" \
|
||||
|| exit 1; \
|
||||
fi; \
|
||||
done
|
||||
check-am: all-am
|
||||
check: check-am
|
||||
all-am: Makefile $(PROGRAMS)
|
||||
installdirs:
|
||||
for dir in "$(DESTDIR)$(bindir)"; do \
|
||||
test -z "$$dir" || $(MKDIR_P) "$$dir"; \
|
||||
done
|
||||
install: install-am
|
||||
install-exec: install-exec-am
|
||||
install-data: install-data-am
|
||||
uninstall: uninstall-am
|
||||
|
||||
install-am: all-am
|
||||
@$(MAKE) $(AM_MAKEFLAGS) install-exec-am install-data-am
|
||||
|
||||
installcheck: installcheck-am
|
||||
install-strip:
|
||||
if test -z '$(STRIP)'; then \
|
||||
$(MAKE) $(AM_MAKEFLAGS) INSTALL_PROGRAM="$(INSTALL_STRIP_PROGRAM)" \
|
||||
install_sh_PROGRAM="$(INSTALL_STRIP_PROGRAM)" INSTALL_STRIP_FLAG=-s \
|
||||
install; \
|
||||
else \
|
||||
$(MAKE) $(AM_MAKEFLAGS) INSTALL_PROGRAM="$(INSTALL_STRIP_PROGRAM)" \
|
||||
install_sh_PROGRAM="$(INSTALL_STRIP_PROGRAM)" INSTALL_STRIP_FLAG=-s \
|
||||
"INSTALL_PROGRAM_ENV=STRIPPROG='$(STRIP)'" install; \
|
||||
fi
|
||||
mostlyclean-generic:
|
||||
|
||||
clean-generic:
|
||||
|
||||
distclean-generic:
|
||||
-test -z "$(CONFIG_CLEAN_FILES)" || rm -f $(CONFIG_CLEAN_FILES)
|
||||
-test . = "$(srcdir)" || test -z "$(CONFIG_CLEAN_VPATH_FILES)" || rm -f $(CONFIG_CLEAN_VPATH_FILES)
|
||||
|
||||
maintainer-clean-generic:
|
||||
@echo "This command is intended for maintainers to use"
|
||||
@echo "it deletes files that may require special tools to rebuild."
|
||||
clean: clean-am
|
||||
|
||||
clean-am: clean-binPROGRAMS clean-generic clean-libtool mostlyclean-am
|
||||
|
||||
distclean: distclean-am
|
||||
-rm -rf ./$(DEPDIR)
|
||||
-rm -f Makefile
|
||||
distclean-am: clean-am distclean-compile distclean-generic \
|
||||
distclean-tags
|
||||
|
||||
dvi: dvi-am
|
||||
|
||||
dvi-am:
|
||||
|
||||
html: html-am
|
||||
|
||||
html-am:
|
||||
|
||||
info: info-am
|
||||
|
||||
info-am:
|
||||
|
||||
install-data-am:
|
||||
|
||||
install-dvi: install-dvi-am
|
||||
|
||||
install-dvi-am:
|
||||
|
||||
install-exec-am: install-binPROGRAMS
|
||||
|
||||
install-html: install-html-am
|
||||
|
||||
install-html-am:
|
||||
|
||||
install-info: install-info-am
|
||||
|
||||
install-info-am:
|
||||
|
||||
install-man:
|
||||
|
||||
install-pdf: install-pdf-am
|
||||
|
||||
install-pdf-am:
|
||||
|
||||
install-ps: install-ps-am
|
||||
|
||||
install-ps-am:
|
||||
|
||||
installcheck-am:
|
||||
|
||||
maintainer-clean: maintainer-clean-am
|
||||
-rm -rf ./$(DEPDIR)
|
||||
-rm -f Makefile
|
||||
maintainer-clean-am: distclean-am maintainer-clean-generic
|
||||
|
||||
mostlyclean: mostlyclean-am
|
||||
|
||||
mostlyclean-am: mostlyclean-compile mostlyclean-generic \
|
||||
mostlyclean-libtool
|
||||
|
||||
pdf: pdf-am
|
||||
|
||||
pdf-am:
|
||||
|
||||
ps: ps-am
|
||||
|
||||
ps-am:
|
||||
|
||||
uninstall-am: uninstall-binPROGRAMS
|
||||
|
||||
.MAKE: install-am install-strip
|
||||
|
||||
.PHONY: CTAGS GTAGS TAGS all all-am check check-am clean \
|
||||
clean-binPROGRAMS clean-generic clean-libtool cscopelist-am \
|
||||
ctags ctags-am distclean distclean-compile distclean-generic \
|
||||
distclean-libtool distclean-tags distdir dvi dvi-am html \
|
||||
html-am info info-am install install-am install-binPROGRAMS \
|
||||
install-data install-data-am install-dvi install-dvi-am \
|
||||
install-exec install-exec-am install-html install-html-am \
|
||||
install-info install-info-am install-man install-pdf \
|
||||
install-pdf-am install-ps install-ps-am install-strip \
|
||||
installcheck installcheck-am installdirs maintainer-clean \
|
||||
maintainer-clean-generic mostlyclean mostlyclean-compile \
|
||||
mostlyclean-generic mostlyclean-libtool pdf pdf-am ps ps-am \
|
||||
tags tags-am uninstall uninstall-am uninstall-binPROGRAMS
|
||||
|
||||
|
||||
# Tell versions [3.59,3.63) of GNU make to not export all variables.
|
||||
# Otherwise a system limit (for SysV at least) may be exceeded.
|
||||
.NOEXPORT:
|
|
@ -8,6 +8,14 @@
|
|||
* Performs unit testing for gf arithmetic
|
||||
*/
|
||||
|
||||
#include "config.h"
|
||||
|
||||
#ifdef HAVE_POSIX_MEMALIGN
|
||||
#ifndef _XOPEN_SOURCE
|
||||
#define _XOPEN_SOURCE 600
|
||||
#endif
|
||||
#endif
|
||||
|
||||
#include <stdio.h>
|
||||
#include <getopt.h>
|
||||
#include <stdint.h>
|
||||
|
@ -82,6 +90,9 @@ int main(int argc, char **argv)
|
|||
uint32_t mask = 0;
|
||||
char *ra, *rb, *rc, *rd, *target;
|
||||
int align;
|
||||
#ifndef HAVE_POSIX_MEMALIGN
|
||||
char *malloc_ra, *malloc_rb, *malloc_rc, *malloc_rd;
|
||||
#endif
|
||||
|
||||
|
||||
if (argc < 4) usage(NULL);
|
||||
|
@ -116,18 +127,26 @@ int main(int argc, char **argv)
|
|||
c = (gf_general_t *) malloc(sizeof(gf_general_t));
|
||||
d = (gf_general_t *) malloc(sizeof(gf_general_t));
|
||||
|
||||
#if HAVE_POSIX_MEMALIGN
|
||||
if (posix_memalign((void **) &ra, 16, sizeof(char)*REGION_SIZE))
|
||||
ra = NULL;
|
||||
if (posix_memalign((void **) &rb, 16, sizeof(char)*REGION_SIZE))
|
||||
rb = NULL;
|
||||
if (posix_memalign((void **) &rc, 16, sizeof(char)*REGION_SIZE))
|
||||
rc = NULL;
|
||||
if (posix_memalign((void **) &rd, 16, sizeof(char)*REGION_SIZE))
|
||||
rd = NULL;
|
||||
#else
|
||||
//15 bytes extra to make sure it's 16byte aligned
|
||||
ra = (char *) malloc(sizeof(char)*REGION_SIZE+15);
|
||||
rb = (char *) malloc(sizeof(char)*REGION_SIZE+15);
|
||||
rc = (char *) malloc(sizeof(char)*REGION_SIZE+15);
|
||||
rd = (char *) malloc(sizeof(char)*REGION_SIZE+15);
|
||||
|
||||
//this still assumes 8 byte aligned pointer from malloc
|
||||
//(which is usual on 32-bit machines)
|
||||
ra += (uint64_t)ra & 0xf;
|
||||
rb += (uint64_t)rb & 0xf;
|
||||
rc += (uint64_t)rc & 0xf;
|
||||
rd += (uint64_t)rd & 0xf;
|
||||
malloc_ra = (char *) malloc(sizeof(char)*REGION_SIZE+15);
|
||||
malloc_rb = (char *) malloc(sizeof(char)*REGION_SIZE+15);
|
||||
malloc_rc = (char *) malloc(sizeof(char)*REGION_SIZE+15);
|
||||
malloc_rd = (char *) malloc(sizeof(char)*REGION_SIZE+15);
|
||||
ra = (uint8_t *) (((uintptr_t) malloc_ra + 15) & ~((uintptr_t) 0xf));
|
||||
rb = (uint8_t *) (((uintptr_t) malloc_rb + 15) & ~((uintptr_t) 0xf));
|
||||
rc = (uint8_t *) (((uintptr_t) malloc_rc + 15) & ~((uintptr_t) 0xf));
|
||||
rd = (uint8_t *) (((uintptr_t) malloc_rd + 15) & ~((uintptr_t) 0xf));
|
||||
#endif
|
||||
|
||||
if (w <= 32) {
|
||||
mask = 0;
|
||||
|
@ -141,15 +160,12 @@ int main(int argc, char **argv)
|
|||
if (!gf_init_hard(&gf_def, w, GF_MULT_DEFAULT, GF_REGION_DEFAULT, GF_DIVIDE_DEFAULT,
|
||||
(h->mult_type != GF_MULT_COMPOSITE) ? h->prim_poly : 0, 0, 0, NULL, NULL))
|
||||
problem("No default for this value of w");
|
||||
|
||||
if (w == 4) {
|
||||
mult4 = gf_w4_get_mult_table(&gf);
|
||||
}
|
||||
|
||||
if (w == 8) {
|
||||
} else if (w == 8) {
|
||||
mult8 = gf_w8_get_mult_table(&gf);
|
||||
}
|
||||
|
||||
if (w == 16) {
|
||||
} else if (w == 16) {
|
||||
log16 = gf_w16_get_log_table(&gf);
|
||||
alog16 = gf_w16_get_mult_alog_table(&gf);
|
||||
}
|
||||
|
@ -308,7 +324,6 @@ int main(int argc, char **argv)
|
|||
gf_general_val_to_s(c, w, cs, 1);
|
||||
printf("Error in single multiplication (all numbers in hex):\n\n");
|
||||
printf(" gf.multiply(gf, %s, %s) = %s, which is clearly wrong.\n", as, bs, cs);
|
||||
;
|
||||
exit(1);
|
||||
}
|
||||
}
|
||||
|
@ -422,5 +437,22 @@ int main(int argc, char **argv)
|
|||
gf_general_do_region_check(&gf, a, rc+s_start, rd+d_start, target+d_start, bytes, xor);
|
||||
}
|
||||
}
|
||||
|
||||
free(a);
|
||||
free(b);
|
||||
free(c);
|
||||
free(d);
|
||||
#ifdef HAVE_POSIX_MEMALIGN
|
||||
free(ra);
|
||||
free(rb);
|
||||
free(rc);
|
||||
free(rd);
|
||||
#else
|
||||
free(malloc_ra);
|
||||
free(malloc_rb);
|
||||
free(malloc_rc);
|
||||
free(malloc_rd);
|
||||
#endif
|
||||
|
||||
return 0;
|
||||
}
|
||||
|
|
|
@ -1,9 +1,7 @@
|
|||
# GF-Complete 'tools' AM file
|
||||
|
||||
INCLUDES=-I./ -I../include
|
||||
AM_CFLAGS = -O3 $(SIMD_FLAGS) -fPIC $(INCLUDES)
|
||||
|
||||
TESTS=run-tests.sh
|
||||
AM_CPPFLAGS = -I$(top_builddir)/include -I$(top_srcdir)/include
|
||||
AM_CFLAGS = -O3 -fPIC
|
||||
|
||||
bin_PROGRAMS = gf_mult gf_div gf_add gf_time gf_methods gf_poly gf_inline_time
|
||||
|
||||
|
@ -35,3 +33,24 @@ gf_inline_time_SOURCES = gf_inline_time.c
|
|||
#gf_inline_time_LDFLAGS = -lgf_complete
|
||||
gf_inline_time_LDADD = ../src/libgf_complete.la
|
||||
|
||||
# gf_unit 8 A -1 -m LOG_ZERO_EXT is excluded until http://lab.jerasure.org/jerasure/gf-complete/issues/13 is resolved
|
||||
if ENABLE_VALGRIND
|
||||
VALGRIND = | perl -p -e 's|^|../libtool --mode=execute valgrind --quiet --error-exitcode=1 --tool=memcheck | if(!/gf_unit 8 A -1 -m LOG_ZERO_EXT/)'
|
||||
endif
|
||||
|
||||
# gf_unit tests as generated by gf_methods
|
||||
gf_unit_w%.sh: gf_methods
|
||||
./$^ $(@:gf_unit_w%.sh=%) -A -U ${VALGRIND} > $@ || rm $@
|
||||
|
||||
TESTS = gf_unit_w128.sh \
|
||||
gf_unit_w64.sh \
|
||||
gf_unit_w32.sh \
|
||||
gf_unit_w16.sh \
|
||||
gf_unit_w8.sh \
|
||||
gf_unit_w4.sh
|
||||
|
||||
TEST_EXTENSIONS = .sh
|
||||
SH_LOG_COMPILER = $(SHELL)
|
||||
AM_SH_LOG_FLAGS = -e
|
||||
|
||||
CLEANFILES = $(TESTS)
|
||||
|
|
1068
tools/Makefile.in
|
@ -116,8 +116,7 @@ int main(int argc, char **argv)
|
|||
printf("Inline mult: %10.6lf s Mops: %10.3lf %10.3lf Mega-ops/s\n",
|
||||
elapsed, dnum/1024.0/1024.0, dnum/1024.0/1024.0/elapsed);
|
||||
|
||||
}
|
||||
if (w == 8) {
|
||||
} else if (w == 8) {
|
||||
mult8 = gf_w8_get_mult_table(&gf);
|
||||
if (mult8 == NULL) {
|
||||
printf("Couldn't get inline multiplication table.\n");
|
||||
|
@ -139,8 +138,7 @@ int main(int argc, char **argv)
|
|||
}
|
||||
printf("Inline mult: %10.6lf s Mops: %10.3lf %10.3lf Mega-ops/s\n",
|
||||
elapsed, dnum/1024.0/1024.0, dnum/1024.0/1024.0/elapsed);
|
||||
}
|
||||
if (w == 16) {
|
||||
} else if (w == 16) {
|
||||
log16 = gf_w16_get_log_table(&gf);
|
||||
alog16 = gf_w16_get_mult_alog_table(&gf);
|
||||
if (log16 == NULL) {
|
||||
|
@ -164,5 +162,9 @@ int main(int argc, char **argv)
|
|||
printf("Inline mult: %10.6lf s Mops: %10.3lf %10.3lf Mega-ops/s\n",
|
||||
elapsed, dnum/1024.0/1024.0, dnum/1024.0/1024.0/elapsed);
|
||||
}
|
||||
free (ra);
|
||||
free (rb);
|
||||
free (ra16);
|
||||
free (rb16);
|
||||
return 0;
|
||||
}
|
||||
|
|
|
@ -20,7 +20,6 @@
|
|||
#define BNMULTS (8)
|
||||
static char *BMULTS[BNMULTS] = { "CARRY_FREE", "GROUP48",
|
||||
"TABLE", "LOG", "SPLIT4", "SPLIT8", "SPLIT88", "COMPOSITE" };
|
||||
//ADAM
|
||||
#define NMULTS (17)
|
||||
static char *MULTS[NMULTS] = { "SHIFT", "CARRY_FREE", "CARRY_FREE_GK", "GROUP44", "GROUP48", "BYTWO_p", "BYTWO_b",
|
||||
"TABLE", "LOG", "LOG_ZERO", "LOG_ZERO_EXT", "SPLIT2",
|
||||
|
@ -29,7 +28,7 @@ static char *MULTS[NMULTS] = { "SHIFT", "CARRY_FREE", "CARRY_FREE_GK", "GROUP44"
|
|||
/* Make sure CAUCHY is last */
|
||||
|
||||
#define NREGIONS (7)
|
||||
static char *REGIONS[NREGIONS] = { "DOUBLE", "QUAD", "LAZY", "SSE", "NOSSE",
|
||||
static char *REGIONS[NREGIONS] = { "DOUBLE", "QUAD", "LAZY", "SIMD", "NOSIMD",
|
||||
"ALTMAP", "CAUCHY" };
|
||||
|
||||
#define BNREGIONS (4)
|
||||
|
@ -40,7 +39,7 @@ static char *divides[NDIVS] = { "MATRIX", "EUCLID" };
|
|||
|
||||
void usage(char *s)
|
||||
{
|
||||
fprintf(stderr, "usage: gf_methods w -BADC -LUMDRB\n");
|
||||
fprintf(stderr, "usage: gf_methods w -BADC -LXUMDRB\n");
|
||||
fprintf(stderr, "\n");
|
||||
fprintf(stderr, " w can be 1-32, 64, 128\n");
|
||||
fprintf(stderr, "\n");
|
||||
|
@ -51,6 +50,7 @@ void usage(char *s)
|
|||
fprintf(stderr, " Combinations are fine.\n");
|
||||
fprintf(stderr, "\n");
|
||||
fprintf(stderr, " -L Simply lists methods\n");
|
||||
fprintf(stderr, " -X List methods and functions selected (compile with DEBUG_FUNCTIONS)\n");
|
||||
fprintf(stderr, " -U Produces calls to gf_unit\n");
|
||||
fprintf(stderr, " -M Produces calls to time_tool.sh for single multiplications\n");
|
||||
fprintf(stderr, " -D Produces calls to time_tool.sh for single divisions\n");
|
||||
|
@ -64,6 +64,19 @@ void usage(char *s)
|
|||
exit(1);
|
||||
}
|
||||
|
||||
void print_methods(gf_t *gf)
|
||||
{
|
||||
#ifdef DEBUG_FUNCTIONS
|
||||
gf_internal_t *h = (gf_internal_t*) gf->scratch;
|
||||
|
||||
printf("multiply = %s\n", h->multiply);
|
||||
printf("divide = %s\n", h->divide);
|
||||
printf("inverse = %s\n", h->inverse);
|
||||
printf("multiply_region = %s\n", h->multiply_region);
|
||||
printf("extract_word = %s\n", h->extract_word);
|
||||
#endif
|
||||
}
|
||||
|
||||
int main(int argc, char *argv[])
|
||||
{
|
||||
int m, r, d, w, i, sa, j, k, reset, ok;
|
||||
|
@ -100,12 +113,12 @@ int main(int argc, char *argv[])
|
|||
}
|
||||
}
|
||||
|
||||
if (strchr("LUMDRB", argv[3][1]) == NULL) { usage("Bad -LUMDRB"); }
|
||||
if (strchr("LXUMDRB", argv[3][1]) == NULL) { usage("Bad -LXUMDRB"); }
|
||||
listing = argv[3][1];
|
||||
|
||||
if (listing == 'U') {
|
||||
w_str = "../test/gf_unit %d A -1";
|
||||
} else if (listing == 'L') {
|
||||
} else if (listing == 'L' || listing == 'X') {
|
||||
w_str = "w=%d:";
|
||||
} else {
|
||||
w_str = strdup("sh time_tool.sh X %d");
|
||||
|
@ -193,6 +206,8 @@ int main(int argc, char *argv[])
|
|||
printf(w_str, w);
|
||||
for (j = 0; j < sa; j++) printf(" %s", gf_argv[j]);
|
||||
printf("\n");
|
||||
if (listing == 'X')
|
||||
print_methods(&gf);
|
||||
gf_free(&gf, 1);
|
||||
} else if (_gf_errno == GF_E_DEFAULT) {
|
||||
fprintf(stderr, "Unlabeled failed method: w=%d:", w);
|
||||
|
@ -213,6 +228,8 @@ int main(int argc, char *argv[])
|
|||
printf(w_str, w);
|
||||
for (j = 0; j < sa; j++) printf(" %s", gf_argv[j]);
|
||||
printf("\n");
|
||||
if (listing == 'X')
|
||||
print_methods(&gf);
|
||||
gf_free(&gf, 1);
|
||||
} else if (_gf_errno == GF_E_DEFAULT) {
|
||||
fprintf(stderr, "Unlabeled failed method: w=%d:", w);
|
||||
|
|
|
@ -52,6 +52,7 @@
|
|||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
#include <string.h>
|
||||
#include <assert.h>
|
||||
|
||||
char *BM = "Bad Method: ";
|
||||
|
||||
|
@ -203,9 +204,14 @@ int main(int argc, char **argv)
|
|||
sprintf(string, "Argument '%s' not in proper format of power:coefficient\n", argv[i]);
|
||||
usage(string);
|
||||
}
|
||||
if (power < 0) usage("Can't have negative powers\n");
|
||||
if (power > n) n = power;
|
||||
if (power < 0) {
|
||||
usage("Can't have negative powers\n");
|
||||
} else {
|
||||
n = power;
|
||||
}
|
||||
}
|
||||
// in case the for-loop header fails
|
||||
assert (n >= 0);
|
||||
|
||||
poly = (gf_general_t *) malloc(sizeof(gf_general_t)*(n+1));
|
||||
for (i = 0; i <= n; i++) gf_general_set_zero(poly+i, w);
|
||||
|
|
|
@ -8,6 +8,14 @@
|
|||
* Performs timing for gf arithmetic
|
||||
*/
|
||||
|
||||
#include "config.h"
|
||||
|
||||
#ifdef HAVE_POSIX_MEMALIGN
|
||||
#ifndef _XOPEN_SOURCE
|
||||
#define _XOPEN_SOURCE 600
|
||||
#endif
|
||||
#endif
|
||||
|
||||
#include <stdio.h>
|
||||
#include <getopt.h>
|
||||
#include <stdint.h>
|
||||
|
@ -95,6 +103,9 @@ int main(int argc, char **argv)
|
|||
time_t t0;
|
||||
uint8_t *ra, *rb;
|
||||
gf_general_t a;
|
||||
#ifndef HAVE_POSIX_MEMALIGN
|
||||
uint8_t *malloc_ra, *malloc_rb;
|
||||
#endif
|
||||
|
||||
|
||||
if (argc < 6) usage(NULL);
|
||||
|
@ -155,8 +166,17 @@ int main(int argc, char **argv)
|
|||
|
||||
printf("Seed: %ld\n", t0);
|
||||
|
||||
ra = (uint8_t *) malloc(size);
|
||||
rb = (uint8_t *) malloc(size);
|
||||
#ifdef HAVE_POSIX_MEMALIGN
|
||||
if (posix_memalign((void **) &ra, 16, size))
|
||||
ra = NULL;
|
||||
if (posix_memalign((void **) &rb, 16, size))
|
||||
rb = NULL;
|
||||
#else
|
||||
malloc_ra = (uint8_t *) malloc(size + 15);
|
||||
malloc_rb = (uint8_t *) malloc(size + 15);
|
||||
ra = (uint8_t *) (((uintptr_t) malloc_ra + 15) & ~((uintptr_t) 0xf));
|
||||
rb = (uint8_t *) (((uintptr_t) malloc_rb + 15) & ~((uintptr_t) 0xf));
|
||||
#endif
|
||||
|
||||
if (ra == NULL || rb == NULL) { perror("malloc"); exit(1); }
|
||||
|
||||
|
@ -188,8 +208,6 @@ int main(int argc, char **argv)
|
|||
if (tmethods[(int)test] == NULL) {
|
||||
printf("No %s method.\n", tstrings[(int)test]);
|
||||
} else {
|
||||
elapsed = 0;
|
||||
|
||||
if (test == '0') gf_general_set_zero(&a, w);
|
||||
if (test == '1') gf_general_set_one(&a, w);
|
||||
if (test == '2') gf_general_set_two(&a, w);
|
||||
|
|
|
@ -1,9 +0,0 @@
|
|||
#!/bin/bash
|
||||
|
||||
for w in 4 8 16 32 64 128 ; do
|
||||
./gf_methods $w -A -U | sh -e
|
||||
if [ $? != "0" ] ; then
|
||||
echo "Failed unit tests for w=$w"
|
||||
break
|
||||
fi
|
||||
done
|
|
@ -0,0 +1,367 @@
|
|||
#!/bin/bash -e
|
||||
|
||||
# this scripts has a number of tests for SIMD. It can be invoked
|
||||
# on the host or on a QEMU machine.
|
||||
|
||||
script_dir="$( cd "$( dirname "${BASH_SOURCE[0]}" )" && pwd )"
|
||||
host_cpu=`uname -p`
|
||||
results=${script_dir}/test_simd.results
|
||||
nprocs=$(grep -c ^processor /proc/cpuinfo)
|
||||
|
||||
# runs unit tests and save the results
|
||||
test_unit(){
|
||||
{ ./configure && make clean && make; } || { echo "Compile FAILED" >> ${results}; return 1; }
|
||||
make -j$nprocs check || { echo "gf_methods $i FAILED" >> ${results}; ((++failed)); }
|
||||
cat tools/test-suite.log >> ${results} || true
|
||||
}
|
||||
|
||||
# build with DEBUG_FUNCTIONS and save all methods selected
|
||||
# to a results file
|
||||
test_functions() {
|
||||
failed=0
|
||||
|
||||
{ ./configure --enable-debug-func && make clean && make; } || { echo "Compile FAILED" >> ${results}; return 1; }
|
||||
for i in 128 64 32 16 8 4; do
|
||||
{ ${script_dir}/gf_methods $i -ACD -X >> ${results}; } || { echo "gf_methods $i FAILED" >> ${results}; ((++failed)); }
|
||||
done
|
||||
|
||||
return ${failed}
|
||||
}
|
||||
|
||||
# build with DEBUG_CPU_FUNCTIONS and print out CPU detection
|
||||
test_detection() {
|
||||
failed=0
|
||||
|
||||
{ ./configure --enable-debug-cpu && make clean && make; } || { echo "Compile FAILED" >> ${results}; return 1; }
|
||||
{ ${script_dir}/gf_methods 32 -ACD -L | grep '#' >> ${results}; } || { echo "gf_methods $i FAILED" >> ${results}; ((++failed)); }
|
||||
|
||||
return ${failed}
|
||||
}
|
||||
|
||||
compile_arm() {
|
||||
failed=0
|
||||
|
||||
echo -n "Compiling with NO SIMD support..." >> ${results}
|
||||
{ ./configure --disable-neon && make clean && make && echo "SUCCESS" >> ${results}; } || { echo "FAIL" >> ${results}; ((++failed)); }
|
||||
|
||||
echo -n "Compiling with FULL SIMD support..." >> ${results}
|
||||
{ ./configure && make clean && make && echo "SUCCESS" >> ${results}; } || { echo "FAIL" >> ${results}; ((++failed)); }
|
||||
|
||||
return ${failed}
|
||||
}
|
||||
|
||||
compile_intel() {
|
||||
failed=0
|
||||
|
||||
echo -n "Compiling with NO SIMD support..." >> ${results}
|
||||
{ ./configure && make clean && make && echo "SUCCESS" >> ${results}; } || { echo "FAIL" >> ${results}; ((++failed)); }
|
||||
|
||||
echo -n "Compiling with SSE2 only..." >> ${results}
|
||||
export ax_cv_have_sse_ext=no
|
||||
export ax_cv_have_sse2_ext=yes
|
||||
export ax_cv_have_sse3_ext=no
|
||||
export ax_cv_have_ssse3_ext=no
|
||||
export ax_cv_have_sse41_ext=no
|
||||
export ax_cv_have_sse42_ext=no
|
||||
export ax_cv_have_pclmuldq_ext=no
|
||||
{ ./configure && make clean && make && echo "SUCCESS" >> ${results}; } || { echo "FAIL" >> ${results}; ((++failed)); }
|
||||
|
||||
echo -n "Compiling with SSE2,SSE3 only..." >> ${results}
|
||||
export ax_cv_have_sse_ext=no
|
||||
export ax_cv_have_sse2_ext=yes
|
||||
export ax_cv_have_sse3_ext=yes
|
||||
export ax_cv_have_ssse3_ext=no
|
||||
export ax_cv_have_sse41_ext=no
|
||||
export ax_cv_have_sse42_ext=no
|
||||
export ax_cv_have_pclmuldq_ext=no
|
||||
{ ./configure && make clean && make && echo "SUCCESS" >> ${results}; } || { echo "FAIL" >> ${results}; ((++failed)); }
|
||||
|
||||
echo -n "Compiling with SSE2,SSE3,SSSE3 only..." >> ${results}
|
||||
export ax_cv_have_sse_ext=no
|
||||
export ax_cv_have_sse2_ext=yes
|
||||
export ax_cv_have_sse3_ext=yes
|
||||
export ax_cv_have_ssse3_ext=yes
|
||||
export ax_cv_have_sse41_ext=no
|
||||
export ax_cv_have_sse42_ext=no
|
||||
export ax_cv_have_pclmuldq_ext=no
|
||||
{ ./configure && make clean && make && echo "SUCCESS" >> ${results}; } || { echo "FAIL" >> ${results}; ((++failed)); }
|
||||
|
||||
echo -n "Compiling with SSE2,SSE3,SSSE3,SSE4_1 only..." >> ${results}
|
||||
export ax_cv_have_sse_ext=no
|
||||
export ax_cv_have_sse2_ext=yes
|
||||
export ax_cv_have_sse3_ext=yes
|
||||
export ax_cv_have_ssse3_ext=yes
|
||||
export ax_cv_have_sse41_ext=yes
|
||||
export ax_cv_have_sse42_ext=no
|
||||
export ax_cv_have_pclmuldq_ext=no
|
||||
{ ./configure && make clean && make && echo "SUCCESS" >> ${results}; } || { echo "FAIL" >> ${results}; ((++failed)); }
|
||||
|
||||
echo -n "Compiling with SSE2,SSE3,SSSE3,SSE4_2 only..." >> ${results}
|
||||
export ax_cv_have_sse_ext=no
|
||||
export ax_cv_have_sse2_ext=yes
|
||||
export ax_cv_have_sse3_ext=yes
|
||||
export ax_cv_have_ssse3_ext=yes
|
||||
export ax_cv_have_sse41_ext=no
|
||||
export ax_cv_have_sse42_ext=yes
|
||||
export ax_cv_have_pclmuldq_ext=no
|
||||
{ ./configure && make clean && make && echo "SUCCESS" >> ${results}; } || { echo "FAIL" >> ${results}; ((++failed)); }
|
||||
|
||||
echo -n "Compiling with FULL SIMD support..." >> ${results}
|
||||
export ax_cv_have_sse_ext=no
|
||||
export ax_cv_have_sse2_ext=yes
|
||||
export ax_cv_have_sse3_ext=yes
|
||||
export ax_cv_have_ssse3_ext=yes
|
||||
export ax_cv_have_sse41_ext=yes
|
||||
export ax_cv_have_sse42_ext=yes
|
||||
export ax_cv_have_pclmuldq_ext=yes
|
||||
{ ./configure && make clean && make && echo "SUCCESS" >> ${results}; } || { echo "FAIL" >> ${results}; ((++failed)); }
|
||||
|
||||
return ${failed}
|
||||
}
|
||||
|
||||
# test that we can compile the source code with different
|
||||
# SIMD options. We assume that we are running on processor
|
||||
# full SIMD support
|
||||
test_compile() {
|
||||
case $host_cpu in
|
||||
aarch64*|arm*) compile_arm ;;
|
||||
i[[3456]]86*|x86_64*|amd64*) compile_intel ;;
|
||||
esac
|
||||
}
|
||||
|
||||
# disable through build flags
|
||||
runtime_arm_flags() {
|
||||
failed=0
|
||||
|
||||
echo "====NO SIMD support..." >> ${1}
|
||||
{ ./configure --disable-neon --enable-debug-func && make clean && make; } || { echo "Compile FAILED" >> ${1}; return 1; }
|
||||
for i in 128 64 32 16 8 4; do
|
||||
{ ${script_dir}/gf_methods $i -ACD -X >> ${1}; } || { echo "gf_methods $i FAILED" >> ${1}; ((++failed)); }
|
||||
done
|
||||
|
||||
echo "====FULL SIMD support..." >> ${1}
|
||||
{ ./configure --enable-debug-func && make clean && make; } || { echo "Compile FAILED" >> ${1}; return 1; }
|
||||
for i in 128 64 32 16 8 4; do
|
||||
{ ${script_dir}/gf_methods $i -ACD -X >> ${1}; } || { echo "gf_methods $i FAILED" >> ${1}; ((++failed)); }
|
||||
done
|
||||
|
||||
return ${failed}
|
||||
}
|
||||
|
||||
# build once with FULL SIMD and disable at runtime through environment
|
||||
runtime_arm_env() {
|
||||
failed=0
|
||||
|
||||
{ ./configure --enable-debug-func && make clean && make; } || { echo "Compile FAILED" >> ${1}; return 1; }
|
||||
|
||||
echo "====NO SIMD support..." >> ${1}
|
||||
export GF_COMPLETE_DISABLE_NEON=1
|
||||
for i in 128 64 32 16 8 4; do
|
||||
{ ${script_dir}/gf_methods $i -ACD -X >> ${1}; } || { echo "gf_methods $i FAILED" >> ${1}; ((++failed)); }
|
||||
done
|
||||
|
||||
echo "====FULL SIMD support..." >> ${1}
|
||||
unset GF_COMPLETE_DISABLE_NEON
|
||||
for i in 128 64 32 16 8 4; do
|
||||
{ ${script_dir}/gf_methods $i -ACD -X >> ${1}; } || { echo "gf_methods $i FAILED" >> ${1}; ((++failed)); }
|
||||
done
|
||||
|
||||
return ${failed}
|
||||
}
|
||||
|
||||
runtime_intel_flags() {
|
||||
failed=0
|
||||
|
||||
echo "====NO SIMD support..." >> ${1}
|
||||
{ ./configure --disable-sse --enable-debug-func && make clean && make; } || { echo "FAIL" >> ${1}; ((++failed)); }
|
||||
for i in 128 64 32 16 8 4; do
|
||||
{ ${script_dir}/gf_methods $i -ACD -X >> ${1}; } || { echo "gf_methods $i FAILED" >> ${1}; ((++failed)); }
|
||||
done
|
||||
|
||||
echo "====SSE2 support..." >> ${1}
|
||||
export ax_cv_have_sse_ext=no
|
||||
export ax_cv_have_sse2_ext=yes
|
||||
export ax_cv_have_sse3_ext=no
|
||||
export ax_cv_have_ssse3_ext=no
|
||||
export ax_cv_have_sse41_ext=no
|
||||
export ax_cv_have_sse42_ext=no
|
||||
export ax_cv_have_pclmuldq_ext=no
|
||||
{ ./configure --enable-debug-func && make clean && make; } || { echo "FAIL" >> ${1}; ((++failed)); }
|
||||
for i in 128 64 32 16 8 4; do
|
||||
{ ${script_dir}/gf_methods $i -ACD -X >> ${1}; } || { echo "gf_methods $i FAILED" >> ${1}; ((++failed)); }
|
||||
done
|
||||
|
||||
echo "====SSE2,SSE3 support..." >> ${1}
|
||||
export ax_cv_have_sse_ext=no
|
||||
export ax_cv_have_sse2_ext=yes
|
||||
export ax_cv_have_sse3_ext=yes
|
||||
export ax_cv_have_ssse3_ext=no
|
||||
export ax_cv_have_sse41_ext=no
|
||||
export ax_cv_have_sse42_ext=no
|
||||
export ax_cv_have_pclmuldq_ext=no
|
||||
{ ./configure --enable-debug-func && make clean && make; } || { echo "FAIL" >> ${1}; ((++failed)); }
|
||||
for i in 128 64 32 16 8 4; do
|
||||
{ ${script_dir}/gf_methods $i -ACD -X >> ${1}; } || { echo "gf_methods $i FAILED" >> ${1}; ((++failed)); }
|
||||
done
|
||||
|
||||
echo "====SSE2,SSE3,SSSE3 support..." >> ${1}
|
||||
export ax_cv_have_sse_ext=no
|
||||
export ax_cv_have_sse2_ext=yes
|
||||
export ax_cv_have_sse3_ext=yes
|
||||
export ax_cv_have_ssse3_ext=yes
|
||||
export ax_cv_have_sse41_ext=no
|
||||
export ax_cv_have_sse42_ext=no
|
||||
export ax_cv_have_pclmuldq_ext=no
|
||||
{ ./configure --enable-debug-func && make clean && make; } || { echo "FAIL" >> ${1}; ((++failed)); }
|
||||
for i in 128 64 32 16 8 4; do
|
||||
{ ${script_dir}/gf_methods $i -ACD -X >> ${1}; } || { echo "gf_methods $i FAILED" >> ${1}; ((++failed)); }
|
||||
done
|
||||
|
||||
echo "====SSE2,SSE3,SSSE3,SSE4_1 support..." >> ${1}
|
||||
export ax_cv_have_sse_ext=no
|
||||
export ax_cv_have_sse2_ext=yes
|
||||
export ax_cv_have_sse3_ext=yes
|
||||
export ax_cv_have_ssse3_ext=yes
|
||||
export ax_cv_have_sse41_ext=yes
|
||||
export ax_cv_have_sse42_ext=no
|
||||
export ax_cv_have_pclmuldq_ext=no
|
||||
{ ./configure --enable-debug-func && make clean && make; } || { echo "FAIL" >> ${1}; ((++failed)); }
|
||||
for i in 128 64 32 16 8 4; do
|
||||
{ ${script_dir}/gf_methods $i -ACD -X >> ${1}; } || { echo "gf_methods $i FAILED" >> ${1}; ((++failed)); }
|
||||
done
|
||||
|
||||
echo "====SSE2,SSE3,SSSE3,SSE4_2 support..." >> ${1}
|
||||
export ax_cv_have_sse_ext=no
|
||||
export ax_cv_have_sse2_ext=yes
|
||||
export ax_cv_have_sse3_ext=yes
|
||||
export ax_cv_have_ssse3_ext=yes
|
||||
export ax_cv_have_sse41_ext=no
|
||||
export ax_cv_have_sse42_ext=yes
|
||||
export ax_cv_have_pclmuldq_ext=no
|
||||
{ ./configure --enable-debug-func && make clean && make; } || { echo "FAIL" >> ${1}; ((++failed)); }
|
||||
for i in 128 64 32 16 8 4; do
|
||||
{ ${script_dir}/gf_methods $i -ACD -X >> ${1}; } || { echo "gf_methods $i FAILED" >> ${1}; ((++failed)); }
|
||||
done
|
||||
|
||||
echo "====FULL SIMD support..." >> ${1}
|
||||
{ ./configure --enable-debug-func && make clean && make; } || { echo "FAIL" >> ${1}; ((++failed)); }
|
||||
for i in 128 64 32 16 8 4; do
|
||||
{ ${script_dir}/gf_methods $i -ACD -X >> ${1}; } || { echo "gf_methods $i FAILED" >> ${1}; ((++failed)); }
|
||||
done
|
||||
|
||||
return ${failed}
|
||||
}
|
||||
|
||||
runtime_intel_env() {
|
||||
failed=0
|
||||
|
||||
# compile a build with full SIMD support
|
||||
{ ./configure --enable-debug-func && make clean && make; } || { echo "Compile FAILED" >> ${1}; return 1; }
|
||||
|
||||
echo "====NO SIMD support..." >> ${1}
|
||||
export GF_COMPLETE_DISABLE_SSE2=1
|
||||
export GF_COMPLETE_DISABLE_SSE3=1
|
||||
export GF_COMPLETE_DISABLE_SSSE3=1
|
||||
export GF_COMPLETE_DISABLE_SSE4=1
|
||||
export GF_COMPLETE_DISABLE_SSE4_PCLMUL=1
|
||||
for i in 128 64 32 16 8 4; do
|
||||
{ ${script_dir}/gf_methods $i -ACD -X >> ${1}; } || { echo "gf_methods $i FAILED" >> ${1}; ((++failed)); }
|
||||
done
|
||||
|
||||
echo "====SSE2 support..." >> ${1}
|
||||
unset GF_COMPLETE_DISABLE_SSE2
|
||||
export GF_COMPLETE_DISABLE_SSE3=1
|
||||
export GF_COMPLETE_DISABLE_SSSE3=1
|
||||
export GF_COMPLETE_DISABLE_SSE4=1
|
||||
export GF_COMPLETE_DISABLE_SSE4_PCLMUL=1
|
||||
for i in 128 64 32 16 8 4; do
|
||||
{ ${script_dir}/gf_methods $i -ACD -X >> ${1}; } || { echo "gf_methods $i FAILED" >> ${1}; ((++failed)); }
|
||||
done
|
||||
|
||||
echo "====SSE2,SSE3 support..." >> ${1}
|
||||
unset GF_COMPLETE_DISABLE_SSE2
|
||||
unset GF_COMPLETE_DISABLE_SSE3
|
||||
export GF_COMPLETE_DISABLE_SSSE3=1
|
||||
export GF_COMPLETE_DISABLE_SSE4=1
|
||||
export GF_COMPLETE_DISABLE_SSE4_PCLMUL=1
|
||||
for i in 128 64 32 16 8 4; do
|
||||
{ ${script_dir}/gf_methods $i -ACD -X >> ${1}; } || { echo "gf_methods $i FAILED" >> ${1}; ((++failed)); }
|
||||
done
|
||||
|
||||
echo "====SSE2,SSE3,SSSE3 support..." >> ${1}
|
||||
unset GF_COMPLETE_DISABLE_SSE2
|
||||
unset GF_COMPLETE_DISABLE_SSE3
|
||||
unset GF_COMPLETE_DISABLE_SSSE3
|
||||
export GF_COMPLETE_DISABLE_SSE4=1
|
||||
export GF_COMPLETE_DISABLE_SSE4_PCLMUL=1
|
||||
for i in 128 64 32 16 8 4; do
|
||||
{ ${script_dir}/gf_methods $i -ACD -X >> ${1}; } || { echo "gf_methods $i FAILED" >> ${1}; ((++failed)); }
|
||||
done
|
||||
|
||||
echo "====SSE2,SSE3,SSSE3,SSE4_1 support..." >> ${1}
|
||||
unset GF_COMPLETE_DISABLE_SSE2
|
||||
unset GF_COMPLETE_DISABLE_SSE3
|
||||
unset GF_COMPLETE_DISABLE_SSSE3
|
||||
unset GF_COMPLETE_DISABLE_SSE4
|
||||
export GF_COMPLETE_DISABLE_SSE4_PCLMUL=1
|
||||
for i in 128 64 32 16 8 4; do
|
||||
{ ${script_dir}/gf_methods $i -ACD -X >> ${1}; } || { echo "gf_methods $i FAILED" >> ${1}; ((++failed)); }
|
||||
done
|
||||
|
||||
echo "====SSE2,SSE3,SSSE3,SSE4_2 support..." >> ${1}
|
||||
unset GF_COMPLETE_DISABLE_SSE2
|
||||
unset GF_COMPLETE_DISABLE_SSE3
|
||||
unset GF_COMPLETE_DISABLE_SSSE3
|
||||
unset GF_COMPLETE_DISABLE_SSE4
|
||||
export GF_COMPLETE_DISABLE_SSE4_PCLMUL=1
|
||||
for i in 128 64 32 16 8 4; do
|
||||
{ ${script_dir}/gf_methods $i -ACD -X >> ${1}; } || { echo "gf_methods $i FAILED" >> ${1}; ((++failed)); }
|
||||
done
|
||||
|
||||
echo "====FULL SIMD support..." >> ${1}
|
||||
unset GF_COMPLETE_DISABLE_SSE2
|
||||
unset GF_COMPLETE_DISABLE_SSE3
|
||||
unset GF_COMPLETE_DISABLE_SSSE3
|
||||
unset GF_COMPLETE_DISABLE_SSE4
|
||||
unset GF_COMPLETE_DISABLE_SSE4_PCLMUL
|
||||
for i in 128 64 32 16 8 4; do
|
||||
{ ${script_dir}/gf_methods $i -ACD -X >> ${1}; } || { echo "gf_methods $i FAILED" >> ${1}; ((++failed)); }
|
||||
done
|
||||
|
||||
return ${failed}
|
||||
}
|
||||
|
||||
test_runtime() {
|
||||
rm -f ${results}.left
|
||||
rm -f ${results}.right
|
||||
|
||||
case $host_cpu in
|
||||
aarch64*|arm*)
|
||||
runtime_arm_flags ${results}.left
|
||||
runtime_arm_env ${results}.right
|
||||
;;
|
||||
i[[3456]]86*|x86_64*|amd64*)
|
||||
runtime_intel_flags ${results}.left
|
||||
runtime_intel_env ${results}.right
|
||||
;;
|
||||
esac
|
||||
|
||||
echo "======LEFT======" > ${results}
|
||||
cat ${results}.left >> ${results}
|
||||
echo "======RIGHT======" >> ${results}
|
||||
cat ${results}.right >> ${results}
|
||||
echo "======RESULT======" >> ${results}
|
||||
if diff "${results}.left" "${results}.right"; then
|
||||
echo SUCCESS >> ${results}
|
||||
return 0
|
||||
else
|
||||
echo SUCCESS >> ${results}
|
||||
return 1
|
||||
fi
|
||||
}
|
||||
|
||||
cd ${script_dir}/..
|
||||
rm -f ${results}
|
||||
|
||||
test_$1
|
||||
exit $?
|
|
@ -0,0 +1,258 @@
|
|||
#!/bin/bash -e
|
||||
|
||||
# This script will use QEMU to test gf-complete especially SIMD support
|
||||
# on different architectures and cpus. It will boot a qemu machine
|
||||
# and run an Ubuntu cloud image. All testing will happen inside the
|
||||
# QEMU machine.
|
||||
|
||||
# The following packages are required:
|
||||
# qemu-system-aarch64
|
||||
# qemu-system-arm
|
||||
# qemu-system-x86_64
|
||||
# genisoimage
|
||||
|
||||
|
||||
script_dir="$( cd "$( dirname "${BASH_SOURCE[0]}" )" && pwd )"
|
||||
qemu_dir="${script_dir}/.qemu"
|
||||
ssh_port=2222
|
||||
ssh_pubkey_file="${qemu_dir}/qemu.pub"
|
||||
ssh_key_file="${qemu_dir}/qemu"
|
||||
|
||||
mkdir -p "${qemu_dir}"
|
||||
|
||||
cleanup() {
|
||||
if [[ -n "$(jobs -p)" ]]; then
|
||||
echo killing qemu processes "$(jobs -p)"
|
||||
kill $(jobs -p)
|
||||
fi
|
||||
}
|
||||
|
||||
trap cleanup EXIT
|
||||
|
||||
start_qemu() {
|
||||
arch=$1
|
||||
cpu=$2
|
||||
|
||||
image_version="xenial"
|
||||
image_url_base="http://cloud-images.ubuntu.com/${image_version}/current"
|
||||
|
||||
case $arch in
|
||||
i[[3456]]86*|x86_64*|amd64*)
|
||||
image_kernel="${image_version}-server-cloudimg-amd64-vmlinuz-generic"
|
||||
image_initrd="${image_version}-server-cloudimg-amd64-initrd-generic"
|
||||
image_disk="${image_version}-server-cloudimg-amd64-disk1.img"
|
||||
;;
|
||||
aarch64*)
|
||||
image_kernel="${image_version}-server-cloudimg-arm64-vmlinuz-generic"
|
||||
image_initrd="${image_version}-server-cloudimg-arm64-initrd-generic"
|
||||
image_disk="${image_version}-server-cloudimg-arm64-disk1.img"
|
||||
;;
|
||||
arm*)
|
||||
image_kernel="${image_version}-server-cloudimg-armhf-vmlinuz-lpae"
|
||||
image_initrd="${image_version}-server-cloudimg-armhf-initrd-generic-lpae"
|
||||
image_disk="${image_version}-server-cloudimg-armhf-disk1.img"
|
||||
;;
|
||||
*) die "Unsupported arch" ;;
|
||||
esac
|
||||
|
||||
[[ -f ${qemu_dir}/${image_kernel} ]] || wget -O ${qemu_dir}/${image_kernel} ${image_url_base}/unpacked/${image_kernel}
|
||||
[[ -f ${qemu_dir}/${image_initrd} ]] || wget -O ${qemu_dir}/${image_initrd} ${image_url_base}/unpacked/${image_initrd}
|
||||
[[ -f ${qemu_dir}/${image_disk} ]] || wget -O ${qemu_dir}/${image_disk} ${image_url_base}/${image_disk}
|
||||
|
||||
#create a delta disk to keep the original image clean
|
||||
delta_disk="${qemu_dir}/disk.img"
|
||||
rm -f ${delta_disk}
|
||||
qemu-img create -q -f qcow2 -b "${qemu_dir}/${image_disk}" ${delta_disk}
|
||||
|
||||
# generate an ssh keys
|
||||
[[ -f ${ssh_pubkey_file} ]] || ssh-keygen -q -N "" -f ${ssh_key_file}
|
||||
|
||||
# create a config disk to set the SSH keys
|
||||
cat > "${qemu_dir}/meta-data" <<EOF
|
||||
instance-id: qemu
|
||||
local-hostname: qemu
|
||||
EOF
|
||||
cat > "${qemu_dir}/user-data" <<EOF
|
||||
#cloud-config
|
||||
hostname: qemu
|
||||
manage_etc_hosts: true
|
||||
users:
|
||||
- name: qemu
|
||||
ssh-authorized-keys:
|
||||
- $(cat "${ssh_pubkey_file}")
|
||||
sudo: ['ALL=(ALL) NOPASSWD:ALL']
|
||||
groups: sudo
|
||||
shell: /bin/bash
|
||||
EOF
|
||||
genisoimage -quiet -output "${qemu_dir}/cloud.iso" -volid cidata -joliet -rock "${qemu_dir}/user-data" "${qemu_dir}/meta-data"
|
||||
|
||||
common_args=( \
|
||||
-name "qemu" \
|
||||
-m 1024 \
|
||||
-nodefaults \
|
||||
-nographic \
|
||||
-kernel ${qemu_dir}/${image_kernel} \
|
||||
-initrd ${qemu_dir}/${image_initrd} \
|
||||
-cdrom ${qemu_dir}/cloud.iso \
|
||||
-serial file:${qemu_dir}/console.log
|
||||
)
|
||||
|
||||
case $arch in
|
||||
i[[3456]]86*|x86_64*|amd64*)
|
||||
qemu-system-x86_64 \
|
||||
"${common_args[@]}" \
|
||||
-machine accel=kvm -cpu $cpu \
|
||||
-append "console=ttyS0 root=/dev/sda1" \
|
||||
-hda "${delta_disk}" \
|
||||
-net nic,vlan=0,model=virtio \
|
||||
-net user,vlan=0,hostfwd=tcp::"${ssh_port}"-:22,hostname="${vm_name}" \
|
||||
&
|
||||
;;
|
||||
aarch64*|arm*)
|
||||
qemu-system-$arch \
|
||||
"${common_args[@]}" \
|
||||
-machine virt -cpu $cpu -machine type=virt -smp 1 \
|
||||
-drive if=none,file="${delta_disk}",id=hd0 \
|
||||
-device virtio-blk-device,drive=hd0 \
|
||||
-append "console=ttyAMA0 root=/dev/vda1" \
|
||||
-netdev user,id=eth0,hostfwd=tcp::"${ssh_port}"-:22,hostname="${vm_name}" \
|
||||
-device virtio-net-device,netdev=eth0 \
|
||||
&
|
||||
;;
|
||||
*) die "Unsupported arch" ;;
|
||||
esac
|
||||
|
||||
wait_for_ssh
|
||||
}
|
||||
|
||||
stop_qemu() {
|
||||
run_ssh "sudo shutdown now" || true
|
||||
wait $(jobs -p)
|
||||
}
|
||||
|
||||
shared_args=(
|
||||
-i ${ssh_key_file}
|
||||
-F /dev/null
|
||||
-o BatchMode=yes
|
||||
-o UserKnownHostsFile=/dev/null
|
||||
-o StrictHostKeyChecking=no
|
||||
-o IdentitiesOnly=yes
|
||||
)
|
||||
|
||||
ssh_args=(
|
||||
${shared_args[*]}
|
||||
-p ${ssh_port}
|
||||
)
|
||||
|
||||
wait_for_ssh() {
|
||||
retries=0
|
||||
retry_count=50
|
||||
|
||||
echo "waiting for machine to come up."
|
||||
echo "tail -F ${qemu_dir}/console.log for progress."
|
||||
|
||||
while true; do
|
||||
set +e
|
||||
ssh -q ${ssh_args[*]} -o ConnectTimeout=1 qemu@localhost "echo done"
|
||||
error=$?
|
||||
set -e
|
||||
if [[ $error == 0 ]]; then
|
||||
return 0
|
||||
fi
|
||||
|
||||
if [[ ${retries} == ${retry_count} ]]; then
|
||||
echo "timeout"
|
||||
return 1
|
||||
fi
|
||||
|
||||
echo -n "."
|
||||
((++retries))
|
||||
sleep 10
|
||||
done
|
||||
}
|
||||
|
||||
run_ssh() {
|
||||
ssh -q ${ssh_args[*]} qemu@localhost "$@"
|
||||
}
|
||||
|
||||
run_scp() {
|
||||
scp -q ${shared_args[*]} -P ${ssh_port} "$@"
|
||||
}
|
||||
|
||||
rsync_args=(
|
||||
--exclude '.qemu'
|
||||
--exclude '.git'
|
||||
)
|
||||
|
||||
run_rsync() {
|
||||
rsync -avz -e "ssh ${ssh_args[*]}" ${rsync_args[*]} "$@"
|
||||
}
|
||||
|
||||
init_machine() {
|
||||
run_ssh "sudo apt-get -y install --no-install-recommends make gcc autoconf libtool automake"
|
||||
}
|
||||
|
||||
init_machine_and_copy_source() {
|
||||
init_machine
|
||||
run_ssh "rm -fr ~/gf-complete; mkdir -p ~/gf-complete"
|
||||
run_rsync ${script_dir}/.. qemu@localhost:gf-complete
|
||||
run_ssh "cd ~/gf-complete && ./autogen.sh"
|
||||
}
|
||||
|
||||
run_test() {
|
||||
arch=$1; shift
|
||||
cpu=$1; shift
|
||||
test=$1; shift
|
||||
|
||||
run_ssh "~/gf-complete/tools/test_simd.sh ${test}"
|
||||
run_scp qemu@localhost:gf-complete/tools/test_simd.results ${script_dir}/test_simd_${test}_${arch}_${cpu}.results
|
||||
}
|
||||
|
||||
# this test run the unit tests on the machine using "make check"
|
||||
run_test_simd_basic() {
|
||||
arch=$1; shift
|
||||
cpu=$1; shift
|
||||
|
||||
failed=0
|
||||
|
||||
echo "=====starting qemu machine $arch $cpu"
|
||||
start_qemu $arch $cpu
|
||||
init_machine_and_copy_source
|
||||
echo "=====running compile test"
|
||||
{ run_test $arch $cpu "compile" && echo "SUCCESS"; } || { echo "FAILED"; ((++failed)); }
|
||||
echo "=====running unit test"
|
||||
{ run_test $arch $cpu "unit" && echo "SUCCESS"; } || { echo "FAILED"; ((++failed)); }
|
||||
echo "=====running functions test"
|
||||
{ run_test $arch $cpu "functions" && echo "SUCCESS"; } || { echo "FAILED"; ((++failed)); }
|
||||
echo "=====running detection test"
|
||||
{ run_test $arch $cpu "detection" && echo "SUCCESS"; } || { echo "FAILED"; ((++failed)); }
|
||||
echo "=====running runtime test"
|
||||
{ run_test $arch $cpu "runtime" && echo "SUCCESS"; } || { echo "FAILED"; ((++failed)); }
|
||||
stop_qemu
|
||||
|
||||
return ${failed}
|
||||
}
|
||||
|
||||
run_all_tests() {
|
||||
failed=0
|
||||
|
||||
echo ============================
|
||||
echo =====running x86_64 tests
|
||||
# NOTE: Broadwell has all the supported SIMD instructions
|
||||
{ run_test_simd_basic "x86_64" "Broadwell" && echo "SUCCESS"; } || { echo "FAILED"; ((++failed)); }
|
||||
|
||||
echo ============================
|
||||
echo =====running aarch64 tests
|
||||
# NOTE: cortex-a57 has ASIMD support
|
||||
{ run_test_simd_basic "aarch64" "cortex-a57" && echo "SUCCESS"; } || { echo "FAILED"; ((++failed)); }
|
||||
|
||||
echo ============================
|
||||
echo =====running arm tests
|
||||
# NOTE: cortex-a15 has NEON support
|
||||
{ run_test_simd_basic "arm" "cortex-a15" && echo "SUCCESS"; } || { echo "FAILED"; ((++failed)); }
|
||||
|
||||
return ${failed}
|
||||
}
|
||||
|
||||
run_all_tests
|
||||
exit $?
|