1aaf4363eSJerin Jacob /* SPDX-License-Identifier: BSD-3-Clause
2aaf4363eSJerin Jacob * Copyright(c) 2017 Cavium, Inc
3f0c7bb1bSJerin Jacob */
4f0c7bb1bSJerin Jacob
5f0c7bb1bSJerin Jacob #ifndef __OCTEONTX_IO_H__
6f0c7bb1bSJerin Jacob #define __OCTEONTX_IO_H__
7f0c7bb1bSJerin Jacob
8f0c7bb1bSJerin Jacob #include <stddef.h>
9f0c7bb1bSJerin Jacob #include <stdint.h>
10f0c7bb1bSJerin Jacob
11f0c7bb1bSJerin Jacob #include <rte_io.h>
12f0c7bb1bSJerin Jacob
1395a6b04fSAnoob Joseph /* In Cavium OCTEON TX SoC, all accesses to the device registers are
14f0c7bb1bSJerin Jacob * implicitly strongly ordered. So, The relaxed version of IO operation is
15f0c7bb1bSJerin Jacob * safe to use with out any IO memory barriers.
16f0c7bb1bSJerin Jacob */
17f0c7bb1bSJerin Jacob #define octeontx_read64 rte_read64_relaxed
18f0c7bb1bSJerin Jacob #define octeontx_write64 rte_write64_relaxed
19f0c7bb1bSJerin Jacob
20f0c7bb1bSJerin Jacob /* ARM64 specific functions */
21f0c7bb1bSJerin Jacob #if defined(RTE_ARCH_ARM64)
22*93998f3cSTyler Retzlaff #define octeontx_prefetch_store_keep(_ptr) __extension__ ({\
23f0c7bb1bSJerin Jacob asm volatile("prfm pstl1keep, %a0\n" : : "p" (_ptr)); })
24f0c7bb1bSJerin Jacob
25*93998f3cSTyler Retzlaff #define octeontx_load_pair(val0, val1, addr) __extension__ ({ \
26f0c7bb1bSJerin Jacob asm volatile( \
27f0c7bb1bSJerin Jacob "ldp %x[x0], %x[x1], [%x[p1]]" \
28f0c7bb1bSJerin Jacob :[x0]"=r"(val0), [x1]"=r"(val1) \
29f0c7bb1bSJerin Jacob :[p1]"r"(addr) \
30f0c7bb1bSJerin Jacob ); })
31f0c7bb1bSJerin Jacob
32*93998f3cSTyler Retzlaff #define octeontx_store_pair(val0, val1, addr) __extension__ ({ \
33f0c7bb1bSJerin Jacob asm volatile( \
34f0c7bb1bSJerin Jacob "stp %x[x0], %x[x1], [%x[p1]]" \
35f0c7bb1bSJerin Jacob ::[x0]"r"(val0), [x1]"r"(val1), [p1]"r"(addr) \
36f0c7bb1bSJerin Jacob ); })
37f0c7bb1bSJerin Jacob #else /* Un optimized functions for building on non arm64 arch */
38f0c7bb1bSJerin Jacob
39f0c7bb1bSJerin Jacob #define octeontx_prefetch_store_keep(_ptr) do {} while (0)
40f0c7bb1bSJerin Jacob
41f0c7bb1bSJerin Jacob #define octeontx_load_pair(val0, val1, addr) \
42f0c7bb1bSJerin Jacob do { \
43f0c7bb1bSJerin Jacob val0 = rte_read64(addr); \
44f0c7bb1bSJerin Jacob val1 = rte_read64(((uint8_t *)addr) + 8); \
45f0c7bb1bSJerin Jacob } while (0)
46f0c7bb1bSJerin Jacob
47f0c7bb1bSJerin Jacob #define octeontx_store_pair(val0, val1, addr) \
48f0c7bb1bSJerin Jacob do { \
49f0c7bb1bSJerin Jacob rte_write64(val0, addr); \
50f0c7bb1bSJerin Jacob rte_write64(val1, (((uint8_t *)addr) + 8)); \
51f0c7bb1bSJerin Jacob } while (0)
52f0c7bb1bSJerin Jacob #endif
53f0c7bb1bSJerin Jacob
54f0c7bb1bSJerin Jacob #if defined(RTE_ARCH_ARM64)
55e88bd474SRuifeng Wang #if defined(__ARM_FEATURE_SVE)
56e88bd474SRuifeng Wang #define __LSE_PREAMBLE " .cpu generic+lse+sve\n"
57e88bd474SRuifeng Wang #else
58e88bd474SRuifeng Wang #define __LSE_PREAMBLE " .cpu generic+lse\n"
59e88bd474SRuifeng Wang #endif
60f0c7bb1bSJerin Jacob /**
61f0c7bb1bSJerin Jacob * Perform an atomic fetch-and-add operation.
62f0c7bb1bSJerin Jacob */
63f0c7bb1bSJerin Jacob static inline uint64_t
octeontx_reg_ldadd_u64(void * addr,int64_t off)64f0c7bb1bSJerin Jacob octeontx_reg_ldadd_u64(void *addr, int64_t off)
65f0c7bb1bSJerin Jacob {
66f0c7bb1bSJerin Jacob uint64_t old_val;
67f0c7bb1bSJerin Jacob
68f0c7bb1bSJerin Jacob __asm__ volatile(
69e88bd474SRuifeng Wang __LSE_PREAMBLE
70f0c7bb1bSJerin Jacob " ldadd %1, %0, [%2]\n"
71f0c7bb1bSJerin Jacob : "=r" (old_val) : "r" (off), "r" (addr) : "memory");
72f0c7bb1bSJerin Jacob
73f0c7bb1bSJerin Jacob return old_val;
74f0c7bb1bSJerin Jacob }
75f0c7bb1bSJerin Jacob
76f0c7bb1bSJerin Jacob /**
77f0c7bb1bSJerin Jacob * Perform a LMTST operation - an atomic write of up to 128 byte to
78f0c7bb1bSJerin Jacob * an I/O block that supports this operation type.
79f0c7bb1bSJerin Jacob *
80f0c7bb1bSJerin Jacob * @param lmtline_va is the address where LMTLINE is mapped
81f0c7bb1bSJerin Jacob * @param ioreg_va is the virtual address of the device register
82f0c7bb1bSJerin Jacob * @param cmdbuf is the array of peripheral commands to execute
83f0c7bb1bSJerin Jacob * @param cmdsize is the number of 64-bit words in 'cmdbuf'
84f0c7bb1bSJerin Jacob *
85f0c7bb1bSJerin Jacob * @return N/A
86f0c7bb1bSJerin Jacob */
87f0c7bb1bSJerin Jacob static inline void
octeontx_reg_lmtst(void * lmtline_va,void * ioreg_va,const uint64_t cmdbuf[],uint64_t cmdsize)88f0c7bb1bSJerin Jacob octeontx_reg_lmtst(void *lmtline_va, void *ioreg_va, const uint64_t cmdbuf[],
89f0c7bb1bSJerin Jacob uint64_t cmdsize)
90f0c7bb1bSJerin Jacob {
91f0c7bb1bSJerin Jacob uint64_t result;
92f0c7bb1bSJerin Jacob uint64_t word_count;
93f0c7bb1bSJerin Jacob uint64_t *lmtline = lmtline_va;
94f0c7bb1bSJerin Jacob
95f0c7bb1bSJerin Jacob word_count = cmdsize;
96f0c7bb1bSJerin Jacob
97f0c7bb1bSJerin Jacob do {
98f0c7bb1bSJerin Jacob /* Copy commands to LMTLINE */
99f0c7bb1bSJerin Jacob for (result = 0; result < word_count; result += 2) {
100f0c7bb1bSJerin Jacob lmtline[result + 0] = cmdbuf[result + 0];
101f0c7bb1bSJerin Jacob lmtline[result + 1] = cmdbuf[result + 1];
102f0c7bb1bSJerin Jacob }
103f0c7bb1bSJerin Jacob
104f0c7bb1bSJerin Jacob /* LDEOR initiates atomic transfer to I/O device */
105f0c7bb1bSJerin Jacob __asm__ volatile(
106e88bd474SRuifeng Wang __LSE_PREAMBLE
107f0c7bb1bSJerin Jacob " ldeor xzr, %0, [%1]\n"
108f0c7bb1bSJerin Jacob : "=r" (result) : "r" (ioreg_va) : "memory");
109f0c7bb1bSJerin Jacob } while (!result);
110f0c7bb1bSJerin Jacob }
111f0c7bb1bSJerin Jacob
112e88bd474SRuifeng Wang #undef __LSE_PREAMBLE
113f0c7bb1bSJerin Jacob #else
114f0c7bb1bSJerin Jacob
115f0c7bb1bSJerin Jacob static inline uint64_t
octeontx_reg_ldadd_u64(void * addr,int64_t off)116f0c7bb1bSJerin Jacob octeontx_reg_ldadd_u64(void *addr, int64_t off)
117f0c7bb1bSJerin Jacob {
118f0c7bb1bSJerin Jacob RTE_SET_USED(addr);
119f0c7bb1bSJerin Jacob RTE_SET_USED(off);
120f0c7bb1bSJerin Jacob return 0;
121f0c7bb1bSJerin Jacob }
122f0c7bb1bSJerin Jacob
123f0c7bb1bSJerin Jacob static inline void
octeontx_reg_lmtst(void * lmtline_va,void * ioreg_va,const uint64_t cmdbuf[],uint64_t cmdsize)124f0c7bb1bSJerin Jacob octeontx_reg_lmtst(void *lmtline_va, void *ioreg_va, const uint64_t cmdbuf[],
125f0c7bb1bSJerin Jacob uint64_t cmdsize)
126f0c7bb1bSJerin Jacob {
127f0c7bb1bSJerin Jacob RTE_SET_USED(lmtline_va);
128f0c7bb1bSJerin Jacob RTE_SET_USED(ioreg_va);
129f0c7bb1bSJerin Jacob RTE_SET_USED(cmdbuf);
130f0c7bb1bSJerin Jacob RTE_SET_USED(cmdsize);
131f0c7bb1bSJerin Jacob }
132f0c7bb1bSJerin Jacob
133f0c7bb1bSJerin Jacob #endif
134f0c7bb1bSJerin Jacob #endif /* __OCTEONTX_IO_H__ */
135