// SPDX-License-Identifier: GPL-2.0-only
/*
 * The On Chip Memory (OCMEM) allocator allows various clients to allocate
 * memory from OCMEM based on performance, latency and power requirements.
 * This is typically used by the GPU, camera/video, and audio components on
 * some Snapdragon SoCs.
 *
 * Copyright (C) 2019 Brian Masney <masneyb@onstation.org>
 * Copyright (C) 2015 Red Hat. Author: Rob Clark <robdclark@gmail.com>
 */

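/*
 * Typical client usage (a minimal sketch, not copied from any in-tree user):
 * resolve the OCMEM instance through the client's "sram" phandle, allocate a
 * graphics buffer, hand buf->addr to the client hardware, and free it again
 * when done:
 *
 *	struct ocmem *ocmem = of_get_ocmem(dev);
 *	struct ocmem_buf *buf;
 *
 *	if (IS_ERR(ocmem))
 *		return PTR_ERR(ocmem);
 *
 *	buf = ocmem_allocate(ocmem, OCMEM_GRAPHICS, SZ_1M);
 *	if (IS_ERR(buf))
 *		return PTR_ERR(buf);
 *
 *	... program buf->addr into the client hardware ...
 *
 *	ocmem_free(ocmem, OCMEM_GRAPHICS, buf);
 */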
#include <linux/bitfield.h>
#include <linux/cleanup.h>
#include <linux/clk.h>
#include <linux/io.h>
#include <linux/kernel.h>
#include <linux/module.h>
#include <linux/of.h>
#include <linux/of_platform.h>
#include <linux/platform_device.h>
#include <linux/firmware/qcom/qcom_scm.h>
#include <linux/sizes.h>
#include <linux/slab.h>
#include <linux/types.h>
#include <soc/qcom/ocmem.h>

enum region_mode {
	WIDE_MODE = 0x0,
	THIN_MODE,
	MODE_DEFAULT = WIDE_MODE,
};

enum ocmem_macro_state {
	PASSTHROUGH = 0,
	PERI_ON = 1,
	CORE_ON = 2,
	CLK_OFF = 4,
};

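/*
 * OCMEM is split into a small number of regions; each region consists of up
 * to four macros (banks) whose power state is controlled individually via
 * the per-region PSGSC control registers.
 */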
struct ocmem_region {
	bool interleaved;
	enum region_mode mode;
	unsigned int num_macros;
	enum ocmem_macro_state macro_state[4];
	unsigned long macro_size;
	unsigned long region_size;
};

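/* Per-SoC OCMEM configuration, selected through the OF match data below. */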
struct ocmem_config {
	uint8_t num_regions;
	unsigned long macro_size;
};

struct ocmem {
	struct device *dev;
	const struct ocmem_config *config;
	struct resource *memory;
	void __iomem *mmio;
	struct clk *core_clk;
	struct clk *iface_clk;
	unsigned int num_ports;
	unsigned int num_macros;
	bool interleaved;
	struct ocmem_region *regions;
	unsigned long active_allocations;
};

#define OCMEM_MIN_ALIGN				SZ_64K
#define OCMEM_MIN_ALLOC				SZ_64K

#define OCMEM_REG_HW_VERSION			0x00000000
#define OCMEM_REG_HW_PROFILE			0x00000004

#define OCMEM_REG_REGION_MODE_CTL		0x00001000
#define OCMEM_REGION_MODE_CTL_REG0_THIN		0x00000001
#define OCMEM_REGION_MODE_CTL_REG1_THIN		0x00000002
#define OCMEM_REGION_MODE_CTL_REG2_THIN		0x00000004
#define OCMEM_REGION_MODE_CTL_REG3_THIN		0x00000008

#define OCMEM_REG_GFX_MPU_START			0x00001004
#define OCMEM_REG_GFX_MPU_END			0x00001008

#define OCMEM_HW_VERSION_MAJOR(val)		FIELD_GET(GENMASK(31, 28), val)
#define OCMEM_HW_VERSION_MINOR(val)		FIELD_GET(GENMASK(27, 16), val)
#define OCMEM_HW_VERSION_STEP(val)		FIELD_GET(GENMASK(15, 0), val)

#define OCMEM_HW_PROFILE_NUM_PORTS(val)		FIELD_GET(0x0000000f, (val))
#define OCMEM_HW_PROFILE_NUM_MACROS(val)	FIELD_GET(0x00003f00, (val))

#define OCMEM_HW_PROFILE_LAST_REGN_HALFSIZE	0x00010000
#define OCMEM_HW_PROFILE_INTERLEAVING		0x00020000
#define OCMEM_REG_GEN_STATUS			0x0000000c

#define OCMEM_REG_PSGSC_STATUS			0x00000038
#define OCMEM_REG_PSGSC_CTL(i0)			(0x0000003c + 0x1*(i0))

#define OCMEM_PSGSC_CTL_MACRO0_MODE(val)	FIELD_PREP(0x00000007, (val))
#define OCMEM_PSGSC_CTL_MACRO1_MODE(val)	FIELD_PREP(0x00000070, (val))
#define OCMEM_PSGSC_CTL_MACRO2_MODE(val)	FIELD_PREP(0x00000700, (val))
#define OCMEM_PSGSC_CTL_MACRO3_MODE(val)	FIELD_PREP(0x00007000, (val))

static inline void ocmem_write(struct ocmem *ocmem, u32 reg, u32 data)
{
	writel(data, ocmem->mmio + reg);
}

static inline u32 ocmem_read(struct ocmem *ocmem, u32 reg)
{
	return readl(ocmem->mmio + reg);
}

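/*
 * Push the software view of the region modes and per-macro power states out
 * to the hardware. When the secure world owns the OCMEM lock interface, the
 * region mode control register is not written from Linux.
 */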
static void update_ocmem(struct ocmem *ocmem)
{
	uint32_t region_mode_ctrl = 0x0;
	int i;

	if (!qcom_scm_ocmem_lock_available()) {
		for (i = 0; i < ocmem->config->num_regions; i++) {
			struct ocmem_region *region = &ocmem->regions[i];

			if (region->mode == THIN_MODE)
				region_mode_ctrl |= BIT(i);
		}

		dev_dbg(ocmem->dev, "ocmem_region_mode_control %x\n",
			region_mode_ctrl);
		ocmem_write(ocmem, OCMEM_REG_REGION_MODE_CTL, region_mode_ctrl);
	}

	for (i = 0; i < ocmem->config->num_regions; i++) {
		struct ocmem_region *region = &ocmem->regions[i];
		u32 data;

		data = OCMEM_PSGSC_CTL_MACRO0_MODE(region->macro_state[0]) |
			OCMEM_PSGSC_CTL_MACRO1_MODE(region->macro_state[1]) |
			OCMEM_PSGSC_CTL_MACRO2_MODE(region->macro_state[2]) |
			OCMEM_PSGSC_CTL_MACRO3_MODE(region->macro_state[3]);

		ocmem_write(ocmem, OCMEM_REG_PSGSC_CTL(i), data);
	}
}

static unsigned long phys_to_offset(struct ocmem *ocmem,
				    unsigned long addr)
{
	if (addr < ocmem->memory->start || addr >= ocmem->memory->end)
		return 0;

	return addr - ocmem->memory->start;
}

static unsigned long device_address(struct ocmem *ocmem,
				    enum ocmem_client client,
				    unsigned long addr)
{
	WARN_ON(client != OCMEM_GRAPHICS);

	/* TODO: gpu uses phys_to_offset, but others do not.. */
	return phys_to_offset(ocmem, addr);
}

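/*
 * Walk all regions and, for every macro that falls within @buf, apply the
 * requested macro power state and region mode, then write the result to the
 * hardware via update_ocmem().
 */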
static void update_range(struct ocmem *ocmem, struct ocmem_buf *buf,
			 enum ocmem_macro_state mstate, enum region_mode rmode)
{
	unsigned long offset = 0;
	int i, j;

	for (i = 0; i < ocmem->config->num_regions; i++) {
		struct ocmem_region *region = &ocmem->regions[i];

		if (buf->offset <= offset && offset < buf->offset + buf->len)
			region->mode = rmode;

		for (j = 0; j < region->num_macros; j++) {
			if (buf->offset <= offset &&
			    offset < buf->offset + buf->len)
				region->macro_state[j] = mstate;

			offset += region->macro_size;
		}
	}

	update_ocmem(ocmem);
}

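/**
 * of_get_ocmem() - resolve a client's "sram" phandle to an OCMEM instance
 * @dev: client device whose OF node carries the "sram" phandle
 *
 * Return: the OCMEM handle on success, or an ERR_PTR() on failure.
 * -EPROBE_DEFER is returned while the OCMEM device has not probed yet.
 */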
struct ocmem *of_get_ocmem(struct device *dev)
{
	struct platform_device *pdev;
	struct ocmem *ocmem;

	struct device_node *devnode __free(device_node) = of_parse_phandle(dev->of_node,
									   "sram", 0);
	if (!devnode || !devnode->parent) {
		dev_err(dev, "Cannot look up sram phandle\n");
		return ERR_PTR(-ENODEV);
	}

	pdev = of_find_device_by_node(devnode->parent);
	if (!pdev)
		return dev_err_ptr_probe(dev, -EPROBE_DEFER,
					 "Cannot find device node %s\n",
					 devnode->name);

	ocmem = platform_get_drvdata(pdev);
	put_device(&pdev->dev);
	if (!ocmem)
		return dev_err_ptr_probe(dev, -EPROBE_DEFER, "Cannot get ocmem\n");

	return ocmem;
}
EXPORT_SYMBOL_GPL(of_get_ocmem);

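/**
 * ocmem_allocate() - allocate a chunk of on-chip memory for a client
 * @ocmem: OCMEM instance obtained from of_get_ocmem()
 * @client: requesting client; only OCMEM_GRAPHICS is currently supported
 * @size: requested size; must be at least OCMEM_MIN_ALLOC and aligned to
 *        OCMEM_MIN_ALIGN
 *
 * Return: a buffer describing the allocation, or an ERR_PTR() on failure.
 */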
struct ocmem_buf *ocmem_allocate(struct ocmem *ocmem, enum ocmem_client client,
				 unsigned long size)
{
	int ret;

	/* TODO: add support for other clients... */
	if (WARN_ON(client != OCMEM_GRAPHICS))
		return ERR_PTR(-ENODEV);

	if (size < OCMEM_MIN_ALLOC || !IS_ALIGNED(size, OCMEM_MIN_ALIGN))
		return ERR_PTR(-EINVAL);

	if (test_and_set_bit_lock(BIT(client), &ocmem->active_allocations))
		return ERR_PTR(-EBUSY);

	struct ocmem_buf *buf __free(kfree) = kzalloc(sizeof(*buf), GFP_KERNEL);
	if (!buf) {
		ret = -ENOMEM;
		goto err_unlock;
	}

	buf->offset = 0;
	buf->addr = device_address(ocmem, client, buf->offset);
	buf->len = size;

	update_range(ocmem, buf, CORE_ON, WIDE_MODE);

	if (qcom_scm_ocmem_lock_available()) {
		ret = qcom_scm_ocmem_lock(QCOM_SCM_OCMEM_GRAPHICS_ID,
					  buf->offset, buf->len, WIDE_MODE);
		if (ret) {
			dev_err(ocmem->dev, "could not lock: %d\n", ret);
			ret = -EINVAL;
			goto err_unlock;
		}
	} else {
		ocmem_write(ocmem, OCMEM_REG_GFX_MPU_START, buf->offset);
		ocmem_write(ocmem, OCMEM_REG_GFX_MPU_END,
			    buf->offset + buf->len);
	}

	dev_dbg(ocmem->dev, "using %ldK of OCMEM at 0x%08lx for client %d\n",
		size / 1024, buf->addr, client);

	return_ptr(buf);

err_unlock:
	clear_bit_unlock(BIT(client), &ocmem->active_allocations);

	return ERR_PTR(ret);
}
EXPORT_SYMBOL_GPL(ocmem_allocate);

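/**
 * ocmem_free() - release an allocation made with ocmem_allocate()
 * @ocmem: OCMEM instance the buffer was allocated from
 * @client: client that owns the allocation
 * @buf: buffer to release; it must not be used afterwards
 */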
void ocmem_free(struct ocmem *ocmem, enum ocmem_client client,
		struct ocmem_buf *buf)
{
	/* TODO: add support for other clients... */
	if (WARN_ON(client != OCMEM_GRAPHICS))
		return;

	update_range(ocmem, buf, CLK_OFF, MODE_DEFAULT);

	if (qcom_scm_ocmem_lock_available()) {
		int ret;

		ret = qcom_scm_ocmem_unlock(QCOM_SCM_OCMEM_GRAPHICS_ID,
					    buf->offset, buf->len);
		if (ret)
			dev_err(ocmem->dev, "could not unlock: %d\n", ret);
	} else {
		ocmem_write(ocmem, OCMEM_REG_GFX_MPU_START, 0x0);
		ocmem_write(ocmem, OCMEM_REG_GFX_MPU_END, 0x0);
	}

	kfree(buf);

	clear_bit_unlock(BIT(client), &ocmem->active_allocations);
}
EXPORT_SYMBOL_GPL(ocmem_free);

static int ocmem_dev_probe(struct platform_device *pdev)
{
	struct device *dev = &pdev->dev;
	unsigned long reg, region_size;
	int i, j, ret, num_banks;
	struct ocmem *ocmem;

	if (!qcom_scm_is_available())
		return -EPROBE_DEFER;

	ocmem = devm_kzalloc(dev, sizeof(*ocmem), GFP_KERNEL);
	if (!ocmem)
		return -ENOMEM;

	ocmem->dev = dev;
	ocmem->config = device_get_match_data(dev);

	ocmem->core_clk = devm_clk_get(dev, "core");
	if (IS_ERR(ocmem->core_clk))
		return dev_err_probe(dev, PTR_ERR(ocmem->core_clk),
				     "Unable to get core clock\n");

	ocmem->iface_clk = devm_clk_get_optional(dev, "iface");
	if (IS_ERR(ocmem->iface_clk))
		return dev_err_probe(dev, PTR_ERR(ocmem->iface_clk),
				     "Unable to get iface clock\n");

	ocmem->mmio = devm_platform_ioremap_resource_byname(pdev, "ctrl");
	if (IS_ERR(ocmem->mmio))
		return dev_err_probe(&pdev->dev, PTR_ERR(ocmem->mmio),
				     "Failed to ioremap ocmem_ctrl resource\n");

	ocmem->memory = platform_get_resource_byname(pdev, IORESOURCE_MEM,
						     "mem");
	if (!ocmem->memory) {
		dev_err(dev, "Could not get mem region\n");
		return -ENXIO;
	}

	/* The core clock is synchronous with graphics */
	WARN_ON(clk_set_rate(ocmem->core_clk, 1000) < 0);

	ret = clk_prepare_enable(ocmem->core_clk);
	if (ret)
		return dev_err_probe(ocmem->dev, ret, "Failed to enable core clock\n");

	ret = clk_prepare_enable(ocmem->iface_clk);
	if (ret) {
		clk_disable_unprepare(ocmem->core_clk);
		return dev_err_probe(ocmem->dev, ret, "Failed to enable iface clock\n");
	}

	if (qcom_scm_restore_sec_cfg_available()) {
		dev_dbg(dev, "configuring scm\n");
		ret = qcom_scm_restore_sec_cfg(QCOM_SCM_OCMEM_DEV_ID, 0);
		if (ret) {
			dev_err_probe(dev, ret, "Could not enable secure configuration\n");
			goto err_clk_disable;
		}
	}

	reg = ocmem_read(ocmem, OCMEM_REG_HW_VERSION);
	dev_dbg(dev, "OCMEM hardware version: %lu.%lu.%lu\n",
		OCMEM_HW_VERSION_MAJOR(reg),
		OCMEM_HW_VERSION_MINOR(reg),
		OCMEM_HW_VERSION_STEP(reg));

	reg = ocmem_read(ocmem, OCMEM_REG_HW_PROFILE);
	ocmem->num_ports = OCMEM_HW_PROFILE_NUM_PORTS(reg);
	ocmem->num_macros = OCMEM_HW_PROFILE_NUM_MACROS(reg);
	ocmem->interleaved = !!(reg & OCMEM_HW_PROFILE_INTERLEAVING);

	num_banks = ocmem->num_ports / 2;
	region_size = ocmem->config->macro_size * num_banks;

	dev_info(dev, "%u ports, %u regions, %u macros, %sinterleaved\n",
		 ocmem->num_ports, ocmem->config->num_regions,
		 ocmem->num_macros, ocmem->interleaved ? "" : "not ");

	ocmem->regions = devm_kcalloc(dev, ocmem->config->num_regions,
				      sizeof(struct ocmem_region), GFP_KERNEL);
	if (!ocmem->regions) {
		ret = -ENOMEM;
		goto err_clk_disable;
	}

	for (i = 0; i < ocmem->config->num_regions; i++) {
		struct ocmem_region *region = &ocmem->regions[i];

		if (WARN_ON(num_banks > ARRAY_SIZE(region->macro_state))) {
			ret = -EINVAL;
			goto err_clk_disable;
		}

		region->mode = MODE_DEFAULT;
		region->num_macros = num_banks;

		if (i == (ocmem->config->num_regions - 1) &&
		    reg & OCMEM_HW_PROFILE_LAST_REGN_HALFSIZE) {
			region->macro_size = ocmem->config->macro_size / 2;
			region->region_size = region_size / 2;
		} else {
			region->macro_size = ocmem->config->macro_size;
			region->region_size = region_size;
		}

		for (j = 0; j < ARRAY_SIZE(region->macro_state); j++)
			region->macro_state[j] = CLK_OFF;
	}

	platform_set_drvdata(pdev, ocmem);

	return 0;

err_clk_disable:
	clk_disable_unprepare(ocmem->core_clk);
	clk_disable_unprepare(ocmem->iface_clk);
	return ret;
}

static void ocmem_dev_remove(struct platform_device *pdev)
{
	struct ocmem *ocmem = platform_get_drvdata(pdev);

	clk_disable_unprepare(ocmem->core_clk);
	clk_disable_unprepare(ocmem->iface_clk);
}

static const struct ocmem_config ocmem_8226_config = {
	.num_regions = 1,
	.macro_size = SZ_128K,
};

static const struct ocmem_config ocmem_8974_config = {
	.num_regions = 3,
	.macro_size = SZ_128K,
};

static const struct of_device_id ocmem_of_match[] = {
	{ .compatible = "qcom,msm8226-ocmem", .data = &ocmem_8226_config },
	{ .compatible = "qcom,msm8974-ocmem", .data = &ocmem_8974_config },
	{ }
};

MODULE_DEVICE_TABLE(of, ocmem_of_match);

static struct platform_driver ocmem_driver = {
	.probe = ocmem_dev_probe,
	.remove = ocmem_dev_remove,
	.driver = {
		.name = "ocmem",
		.of_match_table = ocmem_of_match,
	},
};

module_platform_driver(ocmem_driver);

MODULE_DESCRIPTION("On Chip Memory (OCMEM) allocator for some Snapdragon SoCs");
MODULE_LICENSE("GPL v2");