xref: /linux/drivers/gpu/host1x/hw/channel_hw.c (revision bfd5bb6f90af092aa345b15cd78143956a13c2a8)
1 /*
2  * Tegra host1x Channel
3  *
4  * Copyright (c) 2010-2013, NVIDIA Corporation.
5  *
6  * This program is free software; you can redistribute it and/or modify it
7  * under the terms and conditions of the GNU General Public License,
8  * version 2, as published by the Free Software Foundation.
9  *
10  * This program is distributed in the hope it will be useful, but WITHOUT
11  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
12  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
13  * more details.
14  *
15  * You should have received a copy of the GNU General Public License
16  * along with this program.  If not, see <http://www.gnu.org/licenses/>.
17  */
18 
19 #include <linux/host1x.h>
20 #include <linux/slab.h>
21 
22 #include <trace/events/host1x.h>
23 
24 #include "../channel.h"
25 #include "../dev.h"
26 #include "../intr.h"
27 #include "../job.h"
28 
29 #define HOST1X_CHANNEL_SIZE 16384
30 #define TRACE_MAX_LENGTH 128U
31 
32 static void trace_write_gather(struct host1x_cdma *cdma, struct host1x_bo *bo,
33 			       u32 offset, u32 words)
34 {
35 	struct device *dev = cdma_to_channel(cdma)->dev;
36 	void *mem = NULL;
37 
38 	if (host1x_debug_trace_cmdbuf)
39 		mem = host1x_bo_mmap(bo);
40 
41 	if (mem) {
42 		u32 i;
43 		/*
44 		 * Write in batches of 128 as there seems to be a limit
45 		 * of how much you can output to ftrace at once.
46 		 */
47 		for (i = 0; i < words; i += TRACE_MAX_LENGTH) {
48 			u32 num_words = min(words - i, TRACE_MAX_LENGTH);
49 
50 			offset += i * sizeof(u32);
51 
52 			trace_host1x_cdma_push_gather(dev_name(dev), bo,
53 						      num_words, offset,
54 						      mem);
55 		}
56 
57 		host1x_bo_munmap(bo, mem);
58 	}
59 }
60 
61 static void submit_gathers(struct host1x_job *job)
62 {
63 	struct host1x_cdma *cdma = &job->channel->cdma;
64 	unsigned int i;
65 
66 	for (i = 0; i < job->num_gathers; i++) {
67 		struct host1x_job_gather *g = &job->gathers[i];
68 		u32 op1 = host1x_opcode_gather(g->words);
69 		u32 op2 = g->base + g->offset;
70 
71 		trace_write_gather(cdma, g->bo, g->offset, op1 & 0xffff);
72 		host1x_cdma_push(cdma, op1, op2);
73 	}
74 }
75 
76 static inline void synchronize_syncpt_base(struct host1x_job *job)
77 {
78 	struct host1x *host = dev_get_drvdata(job->channel->dev->parent);
79 	struct host1x_syncpt *sp = host->syncpt + job->syncpt_id;
80 	unsigned int id;
81 	u32 value;
82 
83 	value = host1x_syncpt_read_max(sp);
84 	id = sp->base->id;
85 
86 	host1x_cdma_push(&job->channel->cdma,
87 			 host1x_opcode_setclass(HOST1X_CLASS_HOST1X,
88 				HOST1X_UCLASS_LOAD_SYNCPT_BASE, 1),
89 			 HOST1X_UCLASS_LOAD_SYNCPT_BASE_BASE_INDX_F(id) |
90 			 HOST1X_UCLASS_LOAD_SYNCPT_BASE_VALUE_F(value));
91 }
92 
93 static int channel_submit(struct host1x_job *job)
94 {
95 	struct host1x_channel *ch = job->channel;
96 	struct host1x_syncpt *sp;
97 	u32 user_syncpt_incrs = job->syncpt_incrs;
98 	u32 prev_max = 0;
99 	u32 syncval;
100 	int err;
101 	struct host1x_waitlist *completed_waiter = NULL;
102 	struct host1x *host = dev_get_drvdata(ch->dev->parent);
103 
104 	sp = host->syncpt + job->syncpt_id;
105 	trace_host1x_channel_submit(dev_name(ch->dev),
106 				    job->num_gathers, job->num_relocs,
107 				    job->syncpt_id, job->syncpt_incrs);
108 
109 	/* before error checks, return current max */
110 	prev_max = job->syncpt_end = host1x_syncpt_read_max(sp);
111 
112 	/* get submit lock */
113 	err = mutex_lock_interruptible(&ch->submitlock);
114 	if (err)
115 		goto error;
116 
117 	completed_waiter = kzalloc(sizeof(*completed_waiter), GFP_KERNEL);
118 	if (!completed_waiter) {
119 		mutex_unlock(&ch->submitlock);
120 		err = -ENOMEM;
121 		goto error;
122 	}
123 
124 	/* begin a CDMA submit */
125 	err = host1x_cdma_begin(&ch->cdma, job);
126 	if (err) {
127 		mutex_unlock(&ch->submitlock);
128 		goto error;
129 	}
130 
131 	if (job->serialize) {
132 		/*
133 		 * Force serialization by inserting a host wait for the
134 		 * previous job to finish before this one can commence.
135 		 */
136 		host1x_cdma_push(&ch->cdma,
137 				 host1x_opcode_setclass(HOST1X_CLASS_HOST1X,
138 					host1x_uclass_wait_syncpt_r(), 1),
139 				 host1x_class_host_wait_syncpt(job->syncpt_id,
140 					host1x_syncpt_read_max(sp)));
141 	}
142 
143 	/* Synchronize base register to allow using it for relative waiting */
144 	if (sp->base)
145 		synchronize_syncpt_base(job);
146 
147 	syncval = host1x_syncpt_incr_max(sp, user_syncpt_incrs);
148 
149 	host1x_hw_syncpt_assign_to_channel(host, sp, ch);
150 
151 	job->syncpt_end = syncval;
152 
153 	/* add a setclass for modules that require it */
154 	if (job->class)
155 		host1x_cdma_push(&ch->cdma,
156 				 host1x_opcode_setclass(job->class, 0, 0),
157 				 HOST1X_OPCODE_NOP);
158 
159 	submit_gathers(job);
160 
161 	/* end CDMA submit & stash pinned hMems into sync queue */
162 	host1x_cdma_end(&ch->cdma, job);
163 
164 	trace_host1x_channel_submitted(dev_name(ch->dev), prev_max, syncval);
165 
166 	/* schedule a submit complete interrupt */
167 	err = host1x_intr_add_action(host, sp, syncval,
168 				     HOST1X_INTR_ACTION_SUBMIT_COMPLETE, ch,
169 				     completed_waiter, NULL);
170 	completed_waiter = NULL;
171 	WARN(err, "Failed to set submit complete interrupt");
172 
173 	mutex_unlock(&ch->submitlock);
174 
175 	return 0;
176 
177 error:
178 	kfree(completed_waiter);
179 	return err;
180 }
181 
/*
 * Turn on the kernel gather-buffer filter for channel @ch.
 *
 * For HOST1X_HW >= 6 the channel's bit is set in a hypervisor register, and
 * only when hypervisor registers are available (host->hv_regs). For
 * HOST1X_HW 4 and 5 the filter is set through the channel's own CHANNELCTRL
 * register. Older hardware revisions compile to an empty function.
 */
static void enable_gather_filter(struct host1x *host,
				 struct host1x_channel *ch)
{
#if HOST1X_HW >= 6
	if (host->hv_regs) {
		/* one filter bit per channel, 32 channels per register */
		unsigned int bank = ch->id / 32;
		u32 filter;

		filter = host1x_hypervisor_readl(
			host, HOST1X_HV_CH_KERNEL_FILTER_GBUFFER(bank));
		filter |= BIT(ch->id % 32);
		host1x_hypervisor_writel(
			host, filter, HOST1X_HV_CH_KERNEL_FILTER_GBUFFER(bank));
	}
#elif HOST1X_HW >= 4
	host1x_ch_writel(ch,
			 HOST1X_CHANNEL_CHANNELCTRL_KERNEL_FILTER_GBUFFER(1),
			 HOST1X_CHANNEL_CHANNELCTRL);
#endif
}
202 
203 static int host1x_channel_init(struct host1x_channel *ch, struct host1x *dev,
204 			       unsigned int index)
205 {
206 	ch->regs = dev->regs + index * HOST1X_CHANNEL_SIZE;
207 	enable_gather_filter(dev, ch);
208 	return 0;
209 }
210 
211 static const struct host1x_channel_ops host1x_channel_ops = {
212 	.init = host1x_channel_init,
213 	.submit = channel_submit,
214 };
215