neon64_mem.hh revision 10037
1/*
2 * Copyright (c) 2012-2013 ARM Limited
3 * All rights reserved
4 *
5 * The license below extends only to copyright in the software and shall
6 * not be construed as granting a license to any other intellectual
7 * property including but not limited to intellectual property relating
8 * to a hardware implementation of the functionality of the software
9 * licensed hereunder.  You may use the software subject to the license
10 * terms below provided that you ensure that this notice is replicated
11 * unmodified and in its entirety in all distributions of the software,
12 * modified or unmodified, in source code or in binary form.
13 *
14 * Redistribution and use in source and binary forms, with or without
15 * modification, are permitted provided that the following conditions are
16 * met: redistributions of source code must retain the above copyright
17 * notice, this list of conditions and the following disclaimer;
18 * redistributions in binary form must reproduce the above copyright
19 * notice, this list of conditions and the following disclaimer in the
20 * documentation and/or other materials provided with the distribution;
21 * neither the name of the copyright holders nor the names of its
22 * contributors may be used to endorse or promote products derived from
23 * this software without specific prior written permission.
24 *
25 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
26 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
27 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
28 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
29 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
30 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
31 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
32 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
33 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
34 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
35 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
36 *
37 * Authors: Mbou Eyole
38 *          Giacomo Gabrielli
39 */
40
41/// @file
42/// Utility functions and datatypes used by AArch64 NEON memory instructions.
43
44#ifndef __ARCH_ARM_INSTS_NEON64_MEM_HH__
45#define __ARCH_ARM_INSTS_NEON64_MEM_HH__
46
namespace ArmISA
{

/// 64-bit value; used for scalar element data and for each half of a VReg.
typedef uint64_t XReg;

/// 128-bit NEON vector register, stored as two 64-bit halves.
struct VReg {
    XReg hi;  ///< Bits [127:64] of the vector.
    XReg lo;  ///< Bits [63:0] of the vector.
};

/// Write a single NEON vector element leaving the others untouched.
///
/// @param dest  Vector register that is updated in place.
/// @param src   New element value; only its low (8 << eSize) bits are used.
/// @param index Element index, counted from bit 0 of the vector.
/// @param eSize Element size selector:
///              0 -> 8-bit elems,
///              1 -> 16-bit elems,
///              2 -> 32-bit elems,
///              3 -> 64-bit elems
inline void
writeVecElem(VReg *dest, XReg src, int index, int eSize)
{
    // Bound eSize on both sides: a negative value would otherwise pass the
    // check and be used as a (undefined) negative shift count.
    assert(eSize >= 0 && eSize <= 3);

    int eBits = 8 << eSize;

    // Validate the index before multiplying so that the bit position can
    // neither be negative nor overflow, and always lies inside 128 bits.
    assert(index >= 0 && index < 128 / eBits);

    int lsbPos = index * eBits;
    int shiftAmt = lsbPos % 64;

    // Mask covering one element in the low bits. Shifting a 64-bit value by
    // 64 is undefined, so the 64-bit case is handled explicitly.
    XReg elemMask = (eBits == 64) ? ~XReg(0) : ((XReg(1) << eBits) - 1);
    XReg fieldMask = elemMask << shiftAmt;

    // Element sizes divide 64, so an element never straddles the two halves.
    XReg &half = (lsbPos < 64) ? dest->lo : dest->hi;
    half = (half & ~fieldMask) | ((src & elemMask) << shiftAmt);
}

/// Read a single NEON vector element.
///
/// @param src   Vector register to read from.
/// @param index Element index, counted from bit 0 of the vector.
/// @param eSize Element size selector:
///              0 -> 8-bit elems,
///              1 -> 16-bit elems,
///              2 -> 32-bit elems,
///              3 -> 64-bit elems
/// @return The selected element, zero-extended to 64 bits.
inline XReg
readVecElem(VReg src, int index, int eSize)
{
    // Bound eSize on both sides: a negative value would otherwise pass the
    // check and be used as a (undefined) negative shift count.
    assert(eSize >= 0 && eSize <= 3);

    int eBits = 8 << eSize;

    // Validate the index before multiplying so that the bit position can
    // neither be negative nor overflow, and always lies inside 128 bits.
    assert(index >= 0 && index < 128 / eBits);

    int lsbPos = index * eBits;
    int shiftAmt = lsbPos % 64;

    // Mask covering one element in the low bits. Shifting a 64-bit value by
    // 64 is undefined, so the 64-bit case is handled explicitly.
    XReg elemMask = (eBits == 64) ? ~XReg(0) : ((XReg(1) << eBits) - 1);

    // Element sizes divide 64, so an element never straddles the two halves.
    XReg half = (lsbPos < 64) ? src.lo : src.hi;
    return (half >> shiftAmt) & elemMask;
}

}  // namespace ArmISA
127
128#endif  // __ARCH_ARM_INSTS_NEON64_MEM_HH__
129