1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33#include <linux/module.h>
34#include <rdma/ib_umem.h>
35#include <rdma/ib_umem_odp.h>
36#include "mlx5_ib.h"
37
38
39
40
41
42
43
44
45void mlx5_ib_cont_pages(struct ib_umem *umem, u64 addr, int *count, int *shift,
46 int *ncont, int *order)
47{
48 unsigned long tmp;
49 unsigned long m;
50 int i, k;
51 u64 base = 0;
52 int p = 0;
53 int skip;
54 int mask;
55 u64 len;
56 u64 pfn;
57 struct scatterlist *sg;
58 int entry;
59 unsigned long page_shift = ilog2(umem->page_size);
60
61
62 if (umem->odp_data) {
63 *count = ib_umem_page_count(umem);
64 *shift = PAGE_SHIFT;
65 *ncont = *count;
66 if (order)
67 *order = ilog2(roundup_pow_of_two(*count));
68
69 return;
70 }
71
72 addr = addr >> page_shift;
73 tmp = (unsigned long)addr;
74 m = find_first_bit(&tmp, sizeof(tmp));
75 skip = 1 << m;
76 mask = skip - 1;
77 i = 0;
78 for_each_sg(umem->sg_head.sgl, sg, umem->nmap, entry) {
79 len = sg_dma_len(sg) >> page_shift;
80 pfn = sg_dma_address(sg) >> page_shift;
81 for (k = 0; k < len; k++) {
82 if (!(i & mask)) {
83 tmp = (unsigned long)pfn;
84 m = min_t(unsigned long, m, find_first_bit(&tmp, sizeof(tmp)));
85 skip = 1 << m;
86 mask = skip - 1;
87 base = pfn;
88 p = 0;
89 } else {
90 if (base + p != pfn) {
91 tmp = (unsigned long)p;
92 m = find_first_bit(&tmp, sizeof(tmp));
93 skip = 1 << m;
94 mask = skip - 1;
95 base = pfn;
96 p = 0;
97 }
98 }
99 p++;
100 i++;
101 }
102 }
103
104 if (i) {
105 m = min_t(unsigned long, ilog2(roundup_pow_of_two(i)), m);
106
107 if (order)
108 *order = ilog2(roundup_pow_of_two(i) >> m);
109
110 *ncont = DIV_ROUND_UP(i, (1 << m));
111 } else {
112 m = 0;
113
114 if (order)
115 *order = 0;
116
117 *ncont = 0;
118 }
119 *shift = page_shift + m;
120 *count = i;
121}
122
123#ifdef CONFIG_INFINIBAND_ON_DEMAND_PAGING
124static u64 umem_dma_to_mtt(dma_addr_t umem_dma)
125{
126 u64 mtt_entry = umem_dma & ODP_DMA_ADDR_MASK;
127
128 if (umem_dma & ODP_READ_ALLOWED_BIT)
129 mtt_entry |= MLX5_IB_MTT_READ;
130 if (umem_dma & ODP_WRITE_ALLOWED_BIT)
131 mtt_entry |= MLX5_IB_MTT_WRITE;
132
133 return mtt_entry;
134}
135#endif
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150void __mlx5_ib_populate_pas(struct mlx5_ib_dev *dev, struct ib_umem *umem,
151 int page_shift, size_t offset, size_t num_pages,
152 __be64 *pas, int access_flags)
153{
154 unsigned long umem_page_shift = ilog2(umem->page_size);
155 int shift = page_shift - umem_page_shift;
156 int mask = (1 << shift) - 1;
157 int i, k;
158 u64 cur = 0;
159 u64 base;
160 int len;
161 struct scatterlist *sg;
162 int entry;
163#ifdef CONFIG_INFINIBAND_ON_DEMAND_PAGING
164 const bool odp = umem->odp_data != NULL;
165
166 if (odp) {
167 WARN_ON(shift != 0);
168 WARN_ON(access_flags != (MLX5_IB_MTT_READ | MLX5_IB_MTT_WRITE));
169
170 for (i = 0; i < num_pages; ++i) {
171 dma_addr_t pa = umem->odp_data->dma_list[offset + i];
172
173 pas[i] = cpu_to_be64(umem_dma_to_mtt(pa));
174 }
175 return;
176 }
177#endif
178
179 i = 0;
180 for_each_sg(umem->sg_head.sgl, sg, umem->nmap, entry) {
181 len = sg_dma_len(sg) >> umem_page_shift;
182 base = sg_dma_address(sg);
183 for (k = 0; k < len; k++) {
184 if (!(i & mask)) {
185 cur = base + (k << umem_page_shift);
186 cur |= access_flags;
187
188 pas[i >> shift] = cpu_to_be64(cur);
189 mlx5_ib_dbg(dev, "pas[%d] 0x%llx\n",
190 i >> shift, be64_to_cpu(pas[i >> shift]));
191 } else
192 mlx5_ib_dbg(dev, "=====> 0x%llx\n",
193 base + (k << umem_page_shift));
194 i++;
195 }
196 }
197}
198
199void mlx5_ib_populate_pas(struct mlx5_ib_dev *dev, struct ib_umem *umem,
200 int page_shift, __be64 *pas, int access_flags)
201{
202 return __mlx5_ib_populate_pas(dev, umem, page_shift, 0,
203 ib_umem_num_pages(umem), pas,
204 access_flags);
205}
206int mlx5_ib_get_buf_offset(u64 addr, int page_shift, u32 *offset)
207{
208 u64 page_size;
209 u64 page_mask;
210 u64 off_size;
211 u64 off_mask;
212 u64 buf_off;
213
214 page_size = (u64)1 << page_shift;
215 page_mask = page_size - 1;
216 buf_off = addr & page_mask;
217 off_size = page_size >> 6;
218 off_mask = off_size - 1;
219
220 if (buf_off & off_mask)
221 return -EINVAL;
222
223 *offset = buf_off >> ilog2(off_size);
224 return 0;
225}
226