mirror of
https://github.com/sockspls/badfish
synced 2025-04-29 16:23:09 +00:00
Added gcc -msse3 support
It is enabled when selecting x86-64-modern target, this gives another nice speed up: On a Core i5-2500 (3300 Mhz, Sandy Bridge): 64 bit download version: 1597151 n/s -flto : 1659664 n/s -flto -msse3: 1732344 n/s Patch suggested by Tom Vijlbrief. Also unify flto, popcount and msse3 optimization under "modern" target, note that this can break the "modern" build on old gcc that do not support -flto option: in this case update gcc ;-) or default to the standard build. No functional change. Signed-off-by: Marco Costalba <mcostalba@gmail.com>
This commit is contained in:
parent
09b5949cd2
commit
325dedc7da
1 changed files with 19 additions and 21 deletions
40
src/Makefile
40
src/Makefile
|
@ -42,17 +42,16 @@ OBJS = benchmark.o bitbase.o bitboard.o book.o endgame.o evaluate.o main.o \
|
||||||
# flag --- Comp switch --- Description
|
# flag --- Comp switch --- Description
|
||||||
# ----------------------------------------------------------------------------
|
# ----------------------------------------------------------------------------
|
||||||
#
|
#
|
||||||
# debug = no/yes --- -DNDEBUG --- Enable/Disable debug mode
|
# debug = yes/no --- -DNDEBUG --- Enable/Disable debug mode
|
||||||
# optimize = yes/no --- (-O3/-fast etc.) --- Enable/Disable optimizations
|
# optimize = yes/no --- (-O3/-fast etc.) --- Enable/Disable optimizations
|
||||||
# arch = (name) --- (-arch) --- Target architecture
|
# arch = (name) --- (-arch) --- Target architecture
|
||||||
# os = (name) --- --- Target operating system
|
# os = (name) --- --- Target operating system
|
||||||
# bits = 64/32 --- -DIS_64BIT --- 64-/32-bit operating system
|
# bits = 64/32 --- -DIS_64BIT --- 64-/32-bit operating system
|
||||||
# bigendian = no/yes --- -DBIGENDIAN --- big/little-endian byte order
|
# bigendian = yes/no --- -DBIGENDIAN --- big/little-endian byte order
|
||||||
# prefetch = no/yes --- -DUSE_PREFETCH --- Use prefetch x86 asm-instruction
|
# prefetch = yes/no --- -DUSE_PREFETCH --- Use prefetch x86 asm-instruction
|
||||||
# bsfq = no/yes --- -DUSE_BSFQ --- Use bsfq x86_64 asm-instruction
|
# bsfq = yes/no --- -DUSE_BSFQ --- Use bsfq x86_64 asm-instruction (only
|
||||||
# --- (Works only with GCC and ICC 64-bit)
|
# with GCC and ICC 64-bit)
|
||||||
# popcnt = no/yes --- -DUSE_POPCNT --- Use popcnt x86_64 asm-instruction
|
# popcnt = yes/no --- -DUSE_POPCNT --- Use popcnt x86_64 asm-instruction
|
||||||
# lto = no/yes --- -flto --- gcc Link Time Optimization
|
|
||||||
#
|
#
|
||||||
# Note that Makefile is space sensitive, so when adding new architectures
|
# Note that Makefile is space sensitive, so when adding new architectures
|
||||||
# or modifying existing flags, you have to make sure there are no extra spaces
|
# or modifying existing flags, you have to make sure there are no extra spaces
|
||||||
|
@ -124,7 +123,6 @@ ifeq ($(ARCH),x86-64-modern)
|
||||||
prefetch = yes
|
prefetch = yes
|
||||||
bsfq = yes
|
bsfq = yes
|
||||||
popcnt = yes
|
popcnt = yes
|
||||||
lto = yes
|
|
||||||
endif
|
endif
|
||||||
|
|
||||||
ifeq ($(ARCH),x86-32)
|
ifeq ($(ARCH),x86-32)
|
||||||
|
@ -311,14 +309,14 @@ endif
|
||||||
### 3.10 popcnt
|
### 3.10 popcnt
|
||||||
ifeq ($(popcnt),yes)
|
ifeq ($(popcnt),yes)
|
||||||
CXXFLAGS += -DUSE_POPCNT
|
CXXFLAGS += -DUSE_POPCNT
|
||||||
endif
|
|
||||||
|
|
||||||
### 3.11 lto.
|
### For gcc we add also msse3 support and Link Time Optimization, note that
|
||||||
### Note that this is a mix of compile and link time options
|
### this is a mix of compile and link time options because the lto link phase
|
||||||
### because the lto link phase needs access to the optimization flags
|
### needs access to the optimization flags.
|
||||||
ifeq ($(lto),yes)
|
ifeq ($(comp),gcc)
|
||||||
CXXFLAGS += -flto
|
CXXFLAGS += -msse3 -flto
|
||||||
LDFLAGS += $(CXXFLAGS) -static
|
LDFLAGS += $(CXXFLAGS) -static
|
||||||
|
endif
|
||||||
endif
|
endif
|
||||||
|
|
||||||
### ==========================================================================
|
### ==========================================================================
|
||||||
|
@ -335,7 +333,7 @@ help:
|
||||||
@echo ""
|
@echo ""
|
||||||
@echo "build > Build unoptimized version"
|
@echo "build > Build unoptimized version"
|
||||||
@echo "profile-build > Build PGO-optimized version"
|
@echo "profile-build > Build PGO-optimized version"
|
||||||
@echo "popcnt-profile-build > Build PGO-optimized version with optional popcnt-support"
|
@echo "double-profile-build > Build PGO-optimized version with and without popcnt support"
|
||||||
@echo "strip > Strip executable"
|
@echo "strip > Strip executable"
|
||||||
@echo "install > Install executable"
|
@echo "install > Install executable"
|
||||||
@echo "clean > Clean up"
|
@echo "clean > Clean up"
|
||||||
|
@ -344,7 +342,7 @@ help:
|
||||||
@echo "Supported archs:"
|
@echo "Supported archs:"
|
||||||
@echo ""
|
@echo ""
|
||||||
@echo "x86-64 > x86 64-bit"
|
@echo "x86-64 > x86 64-bit"
|
||||||
@echo "x86-64-modern > x86 64-bit with runtime support for popcnt-instruction"
|
@echo "x86-64-modern > x86 64-bit with runtime support for popcnt instruction"
|
||||||
@echo "x86-32 > x86 32-bit excluding very old hardware without SSE-support"
|
@echo "x86-32 > x86 32-bit excluding very old hardware without SSE-support"
|
||||||
@echo "x86-32-old > x86 32-bit including also very old hardware"
|
@echo "x86-32-old > x86 32-bit including also very old hardware"
|
||||||
@echo "osx-ppc-64 > PPC-Mac OS X 64 bit"
|
@echo "osx-ppc-64 > PPC-Mac OS X 64 bit"
|
||||||
|
@ -396,7 +394,7 @@ profile-build:
|
||||||
@echo "Step 4/4. Deleting profile data ..."
|
@echo "Step 4/4. Deleting profile data ..."
|
||||||
$(MAKE) ARCH=$(ARCH) COMP=$(COMP) $(profile_clean)
|
$(MAKE) ARCH=$(ARCH) COMP=$(COMP) $(profile_clean)
|
||||||
|
|
||||||
popcnt-profile-build:
|
double-profile-build:
|
||||||
$(MAKE) ARCH=$(ARCH) COMP=$(COMP) config-sanity
|
$(MAKE) ARCH=$(ARCH) COMP=$(COMP) config-sanity
|
||||||
@echo ""
|
@echo ""
|
||||||
@echo "Step 0/6. Preparing for profile build."
|
@echo "Step 0/6. Preparing for profile build."
|
||||||
|
|
Loading…
Add table
Reference in a new issue