2008-07-18 12:55:51 +08:00
|
|
|
/*
|
2008-07-28 05:00:59 +08:00
|
|
|
* include/asm/xor.h
|
2008-07-18 12:55:51 +08:00
|
|
|
*
|
|
|
|
* High speed xor_block operation for RAID4/5 utilizing the
|
|
|
|
* UltraSparc Visual Instruction Set and Niagara block-init
|
|
|
|
* twin-load instructions.
|
|
|
|
*
|
|
|
|
* Copyright (C) 1997, 1999 Jakub Jelinek (jj@ultra.linux.cz)
|
|
|
|
* Copyright (C) 2006 David S. Miller <davem@davemloft.net>
|
|
|
|
*
|
|
|
|
* This program is free software; you can redistribute it and/or modify
|
|
|
|
* it under the terms of the GNU General Public License as published by
|
|
|
|
* the Free Software Foundation; either version 2, or (at your option)
|
|
|
|
* any later version.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU General Public License
|
|
|
|
* (for example /usr/src/linux/COPYING); if not, write to the Free
|
|
|
|
* Software Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include <asm/spitfire.h>
|
|
|
|
|
2014-05-17 05:25:50 +08:00
|
|
|
void xor_vis_2(unsigned long, unsigned long *, unsigned long *);
|
|
|
|
void xor_vis_3(unsigned long, unsigned long *, unsigned long *,
|
|
|
|
unsigned long *);
|
|
|
|
void xor_vis_4(unsigned long, unsigned long *, unsigned long *,
|
|
|
|
unsigned long *, unsigned long *);
|
|
|
|
void xor_vis_5(unsigned long, unsigned long *, unsigned long *,
|
|
|
|
unsigned long *, unsigned long *, unsigned long *);
|
2008-07-18 12:55:51 +08:00
|
|
|
|
|
|
|
/* XXX Ugh, write cheetah versions... -DaveM */
|
|
|
|
|
|
|
|
static struct xor_block_template xor_block_VIS = {
|
|
|
|
.name = "VIS",
|
|
|
|
.do_2 = xor_vis_2,
|
|
|
|
.do_3 = xor_vis_3,
|
|
|
|
.do_4 = xor_vis_4,
|
|
|
|
.do_5 = xor_vis_5,
|
|
|
|
};
|
|
|
|
|
2014-05-17 05:25:50 +08:00
|
|
|
void xor_niagara_2(unsigned long, unsigned long *, unsigned long *);
|
|
|
|
void xor_niagara_3(unsigned long, unsigned long *, unsigned long *,
|
|
|
|
unsigned long *);
|
|
|
|
void xor_niagara_4(unsigned long, unsigned long *, unsigned long *,
|
|
|
|
unsigned long *, unsigned long *);
|
|
|
|
void xor_niagara_5(unsigned long, unsigned long *, unsigned long *,
|
|
|
|
unsigned long *, unsigned long *, unsigned long *);
|
2008-07-18 12:55:51 +08:00
|
|
|
|
|
|
|
static struct xor_block_template xor_block_niagara = {
|
|
|
|
.name = "Niagara",
|
|
|
|
.do_2 = xor_niagara_2,
|
|
|
|
.do_3 = xor_niagara_3,
|
|
|
|
.do_4 = xor_niagara_4,
|
|
|
|
.do_5 = xor_niagara_5,
|
|
|
|
};
|
|
|
|
|
|
|
|
#undef XOR_TRY_TEMPLATES
|
|
|
|
#define XOR_TRY_TEMPLATES \
|
|
|
|
do { \
|
|
|
|
xor_speed(&xor_block_VIS); \
|
|
|
|
xor_speed(&xor_block_niagara); \
|
|
|
|
} while (0)
|
|
|
|
|
|
|
|
/* For VIS for everything except Niagara. */
|
|
|
|
#define XOR_SELECT_TEMPLATE(FASTEST) \
|
|
|
|
((tlb_type == hypervisor && \
|
|
|
|
(sun4v_chip_type == SUN4V_CHIP_NIAGARA1 || \
|
sparc: Detect and handle UltraSPARC-T3 cpu types.
The cpu compatible string we look for is "SPARC-T3".
As far as memset/memcpy optimizations go, we treat this chip the same
as Niagara-T2/T2+. Use cache initializing stores for memset, and use
perfetch, FPU block loads, cache initializing stores, and block stores
for copies.
We use the Niagara-T2 perf support, since T3 is a close relative in
this regard. Later we'll add support for the new events T3 can
report, plus enable T3's new "sample" mode.
For now I haven't added any new ELF hwcap flags. We probably need
to add a couple, for example:
T2 and T3 both support the population count instruction in hardware.
T3 supports VIS3 instructions, including support (finally) for
partitioned shift. One can also now move directly between float
and integer registers.
T3 supports instructions meant to help with Galois Field and other HPC
calculations, such as XOR multiply. Also there are "OP and negate"
instructions, for example "fnmul" which is multiply-and-negate.
T3 recognizes the transactional memory opcodes, however since
transactional memory isn't supported: 1) 'commit' behaves as a NOP and
2) 'chkpt' always branches 3) 'rdcps' returns all zeros and 4) 'wrcps'
behaves as a NOP.
So we'll need about 3 new elf capability flags in the end to represent
all of these things.
Signed-off-by: David S. Miller <davem@davemloft.net>
2011-07-28 12:06:16 +08:00
|
|
|
sun4v_chip_type == SUN4V_CHIP_NIAGARA2 || \
|
2011-09-12 01:42:20 +08:00
|
|
|
sun4v_chip_type == SUN4V_CHIP_NIAGARA3 || \
|
|
|
|
sun4v_chip_type == SUN4V_CHIP_NIAGARA4 || \
|
|
|
|
sun4v_chip_type == SUN4V_CHIP_NIAGARA5)) ? \
|
2008-07-18 12:55:51 +08:00
|
|
|
&xor_block_niagara : \
|
|
|
|
&xor_block_VIS)
|