// SPDX-License-Identifier: GPL-2.0 WITH Linux-syscall-note
/*
 *
 * (C) COPYRIGHT 2011-2023 ARM Limited. All rights reserved.
 *
 * This program is free software and is provided to you under the terms of the
 * GNU General Public License version 2 as published by the Free Software
 * Foundation, and any use by you of this program is subject to the terms
 * of such GNU license.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, you can access it online at
 * http://www.gnu.org/licenses/gpl-2.0.html.
 *
 */

/*
 * Job Scheduler Implementation
 */
#include <mali_kbase.h>
#include <mali_kbase_js.h>
#include <tl/mali_kbase_tracepoints.h>
#include <mali_linux_trace.h>
#include <mali_kbase_hw.h>
#include <mali_kbase_ctx_sched.h>

#include <mali_kbase_defs.h>
#include <mali_kbase_config_defaults.h>

#include "mali_kbase_jm.h"
#include "mali_kbase_hwaccess_jm.h"
#include <mali_kbase_hwaccess_time.h>
#include <linux/priority_control_manager.h>

/*
 * Private types
 */

/* Bitpattern indicating the result of releasing a context */
enum {
	/* The context was descheduled - caller should try scheduling in a new
	 * one to keep the runpool full
	 */
	KBASEP_JS_RELEASE_RESULT_WAS_DESCHEDULED = (1u << 0),
	/* Ctx attributes were changed - caller should try scheduling all
	 * contexts
	 */
	KBASEP_JS_RELEASE_RESULT_SCHED_ALL = (1u << 1)
};

typedef u32 kbasep_js_release_result;

const int kbasep_js_atom_priority_to_relative[BASE_JD_NR_PRIO_LEVELS] = {
	KBASE_JS_ATOM_SCHED_PRIO_MED, /* BASE_JD_PRIO_MEDIUM */
	KBASE_JS_ATOM_SCHED_PRIO_HIGH, /* BASE_JD_PRIO_HIGH */
	KBASE_JS_ATOM_SCHED_PRIO_LOW, /* BASE_JD_PRIO_LOW */
	KBASE_JS_ATOM_SCHED_PRIO_REALTIME /* BASE_JD_PRIO_REALTIME */
};

const base_jd_prio
kbasep_js_relative_priority_to_atom[KBASE_JS_ATOM_SCHED_PRIO_COUNT] = {
	BASE_JD_PRIO_REALTIME, /* KBASE_JS_ATOM_SCHED_PRIO_REALTIME */
	BASE_JD_PRIO_HIGH, /* KBASE_JS_ATOM_SCHED_PRIO_HIGH */
	BASE_JD_PRIO_MEDIUM, /* KBASE_JS_ATOM_SCHED_PRIO_MED */
	BASE_JD_PRIO_LOW /* KBASE_JS_ATOM_SCHED_PRIO_LOW */
};
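
/*
 * Illustrative note (per the index comments above): the two tables are mutual
 * inverses. For example, kbasep_js_atom_priority_to_relative[BASE_JD_PRIO_HIGH]
 * is KBASE_JS_ATOM_SCHED_PRIO_HIGH, and
 * kbasep_js_relative_priority_to_atom[KBASE_JS_ATOM_SCHED_PRIO_HIGH] maps back
 * to BASE_JD_PRIO_HIGH, so a round trip through both tables returns the
 * original priority value.
 */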

/*
 * Private function prototypes
 */
static kbasep_js_release_result kbasep_js_runpool_release_ctx_internal(
	struct kbase_device *kbdev, struct kbase_context *kctx,
	struct kbasep_js_atom_retained_state *katom_retained_state);

static unsigned int kbase_js_get_slot(struct kbase_device *kbdev, struct kbase_jd_atom *katom);

static void kbase_js_foreach_ctx_job(struct kbase_context *kctx,
				     kbasep_js_ctx_job_cb *callback);

/* Helper for ktrace */
#if KBASE_KTRACE_ENABLE
static int kbase_ktrace_get_ctx_refcnt(struct kbase_context *kctx)
{
	return atomic_read(&kctx->refcount);
}
#else /* KBASE_KTRACE_ENABLE */
static int kbase_ktrace_get_ctx_refcnt(struct kbase_context *kctx)
{
	CSTD_UNUSED(kctx);
	return 0;
}
#endif /* KBASE_KTRACE_ENABLE */

/*
 * Private functions
 */

/**
 * core_reqs_from_jsn_features - Convert JSn_FEATURES to core requirements
 * @features: JSn_FEATURE register value
 *
 * Given a JSn_FEATURE register value returns the core requirements that match
 *
 * Return: Core requirement bit mask
 */
static base_jd_core_req core_reqs_from_jsn_features(u16 features)
{
	base_jd_core_req core_req = 0u;

	if ((features & JS_FEATURE_SET_VALUE_JOB) != 0)
		core_req |= BASE_JD_REQ_V;

	if ((features & JS_FEATURE_CACHE_FLUSH_JOB) != 0)
		core_req |= BASE_JD_REQ_CF;

	if ((features & JS_FEATURE_COMPUTE_JOB) != 0)
		core_req |= BASE_JD_REQ_CS;

	if ((features & JS_FEATURE_TILER_JOB) != 0)
		core_req |= BASE_JD_REQ_T;

	if ((features & JS_FEATURE_FRAGMENT_JOB) != 0)
		core_req |= BASE_JD_REQ_FS;

	return core_req;
}
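
/*
 * Worked example of the conversion above: a job slot whose JSn_FEATURES value
 * has the JS_FEATURE_TILER_JOB and JS_FEATURE_FRAGMENT_JOB bits set yields a
 * core requirement mask of (BASE_JD_REQ_T | BASE_JD_REQ_FS).
 */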

static void kbase_js_sync_timers(struct kbase_device *kbdev)
{
	mutex_lock(&kbdev->js_data.runpool_mutex);
	kbase_backend_ctx_count_changed(kbdev);
	mutex_unlock(&kbdev->js_data.runpool_mutex);
}

/**
 * jsctx_rb_none_to_pull_prio(): - Check if there are no pullable atoms
 * @kctx: Pointer to kbase context with ring buffer.
 * @js: Job slot id to check.
 * @prio: Priority to check.
 *
 * Return true if there are no atoms to pull. There may be running atoms in the
 * ring buffer even if there are no atoms to pull. It is also possible for the
 * ring buffer to be full (with running atoms) when this function returns
 * true.
 *
 * Return: true if there are no atoms to pull, false otherwise.
 */
static inline bool jsctx_rb_none_to_pull_prio(struct kbase_context *kctx, unsigned int js, int prio)
{
	bool none_to_pull;
	struct jsctx_queue *rb = &kctx->jsctx_queue[prio][js];

	lockdep_assert_held(&kctx->kbdev->hwaccess_lock);

	none_to_pull = RB_EMPTY_ROOT(&rb->runnable_tree);

	dev_dbg(kctx->kbdev->dev, "Slot %u (prio %d) is %spullable in kctx %pK\n", js, prio,
		none_to_pull ? "not " : "", kctx);

	return none_to_pull;
}

/**
 * jsctx_rb_none_to_pull(): - Check if all priority ring buffers have no
 * pullable atoms
 * @kctx: Pointer to kbase context with ring buffer.
 * @js: Job slot id to check.
 *
 * Caller must hold hwaccess_lock
 *
 * Return: true if the ring buffers for all priorities have no pullable atoms,
 * false otherwise.
 */
static inline bool jsctx_rb_none_to_pull(struct kbase_context *kctx, unsigned int js)
{
	int prio;

	lockdep_assert_held(&kctx->kbdev->hwaccess_lock);

	for (prio = KBASE_JS_ATOM_SCHED_PRIO_FIRST;
	     prio < KBASE_JS_ATOM_SCHED_PRIO_COUNT; prio++) {
		if (!jsctx_rb_none_to_pull_prio(kctx, js, prio))
			return false;
	}

	return true;
}

/**
 * jsctx_queue_foreach_prio(): - Execute callback for each entry in the queue.
 * @kctx: Pointer to kbase context with the queue.
 * @js: Job slot id to iterate.
 * @prio: Priority id to iterate.
 * @callback: Function pointer to callback.
 *
 * Iterate over a queue and invoke @callback for each entry in the queue, and
 * remove the entry from the queue.
 *
 * If entries are added to the queue while this is running, those entries may
 * or may not be covered. To ensure that all entries in the buffer have been
 * enumerated when this function returns, jsctx->lock must be held when
 * calling this function.
 *
 * The HW access lock must always be held when calling this function.
 */
static void jsctx_queue_foreach_prio(struct kbase_context *kctx, unsigned int js, int prio,
				     kbasep_js_ctx_job_cb *callback)
{
	struct jsctx_queue *queue = &kctx->jsctx_queue[prio][js];

	lockdep_assert_held(&kctx->kbdev->hwaccess_lock);

	while (!RB_EMPTY_ROOT(&queue->runnable_tree)) {
		struct rb_node *node = rb_first(&queue->runnable_tree);
		struct kbase_jd_atom *entry = rb_entry(node,
				struct kbase_jd_atom, runnable_tree_node);

		rb_erase(node, &queue->runnable_tree);
		callback(kctx->kbdev, entry);

		/* Runnable end-of-renderpass atoms can also be in the linked
		 * list of atoms blocked on cross-slot dependencies. Remove them
		 * to avoid calling the callback twice.
		 */
		if (entry->atom_flags & KBASE_KATOM_FLAG_JSCTX_IN_X_DEP_LIST) {
			WARN_ON(!(entry->core_req &
					BASE_JD_REQ_END_RENDERPASS));
			dev_dbg(kctx->kbdev->dev,
				"Del runnable atom %pK from X_DEP list\n",
				(void *)entry);

			list_del(&entry->queue);
			entry->atom_flags &=
					~KBASE_KATOM_FLAG_JSCTX_IN_X_DEP_LIST;
		}
	}

	while (!list_empty(&queue->x_dep_head)) {
		struct kbase_jd_atom *entry = list_entry(queue->x_dep_head.next,
				struct kbase_jd_atom, queue);

		WARN_ON(!(entry->atom_flags &
				KBASE_KATOM_FLAG_JSCTX_IN_X_DEP_LIST));
		dev_dbg(kctx->kbdev->dev,
			"Del blocked atom %pK from X_DEP list\n",
			(void *)entry);

		list_del(queue->x_dep_head.next);
		entry->atom_flags &=
				~KBASE_KATOM_FLAG_JSCTX_IN_X_DEP_LIST;

		callback(kctx->kbdev, entry);
	}
}

/**
 * jsctx_queue_foreach(): - Execute callback for each entry in every queue
 * @kctx: Pointer to kbase context with queue.
 * @js: Job slot id to iterate.
 * @callback: Function pointer to callback.
 *
 * Iterate over all the different priorities, and for each call
 * jsctx_queue_foreach_prio() to iterate over the queue and invoke @callback
 * for each entry, and remove the entry from the queue.
 */
static inline void jsctx_queue_foreach(struct kbase_context *kctx, unsigned int js,
				       kbasep_js_ctx_job_cb *callback)
{
	int prio;

	for (prio = KBASE_JS_ATOM_SCHED_PRIO_FIRST;
	     prio < KBASE_JS_ATOM_SCHED_PRIO_COUNT; prio++)
		jsctx_queue_foreach_prio(kctx, js, prio, callback);
}

/**
 * jsctx_rb_peek_prio(): - Check buffer and get next atom
 * @kctx: Pointer to kbase context with ring buffer.
 * @js: Job slot id to check.
 * @prio: Priority id to check.
 *
 * Check the ring buffer for the specified @js and @prio and return a pointer to
 * the next atom, unless the ring buffer is empty.
 *
 * Return: Pointer to next atom in buffer, or NULL if there is no atom.
 */
static inline struct kbase_jd_atom *jsctx_rb_peek_prio(struct kbase_context *kctx, unsigned int js,
							int prio)
{
	struct jsctx_queue *rb = &kctx->jsctx_queue[prio][js];
	struct rb_node *node;

	lockdep_assert_held(&kctx->kbdev->hwaccess_lock);
	dev_dbg(kctx->kbdev->dev, "Peeking runnable tree of kctx %pK for prio %d (s:%u)\n",
		(void *)kctx, prio, js);

	node = rb_first(&rb->runnable_tree);
	if (!node) {
		dev_dbg(kctx->kbdev->dev, "Tree is empty\n");
		return NULL;
	}

	return rb_entry(node, struct kbase_jd_atom, runnable_tree_node);
}

/**
 * jsctx_rb_peek(): - Check all priority buffers and get next atom
 * @kctx: Pointer to kbase context with ring buffer.
 * @js: Job slot id to check.
 *
 * Check the ring buffers for all priorities, starting from
 * KBASE_JS_ATOM_SCHED_PRIO_REALTIME, for the specified @js and return a
 * pointer to the next atom, unless all the priorities' ring buffers are empty.
 *
 * Caller must hold the hwaccess_lock.
 *
 * Return: Pointer to next atom in buffer, or NULL if there is no atom.
 */
static inline struct kbase_jd_atom *jsctx_rb_peek(struct kbase_context *kctx, unsigned int js)
{
	int prio;

	lockdep_assert_held(&kctx->kbdev->hwaccess_lock);

	for (prio = KBASE_JS_ATOM_SCHED_PRIO_FIRST;
	     prio < KBASE_JS_ATOM_SCHED_PRIO_COUNT; prio++) {
		struct kbase_jd_atom *katom;

		katom = jsctx_rb_peek_prio(kctx, js, prio);
		if (katom)
			return katom;
	}

	return NULL;
}

/**
 * jsctx_rb_pull(): - Mark atom in list as running
 * @kctx: Pointer to kbase context with ring buffer.
 * @katom: Pointer to katom to pull.
 *
 * Mark an atom previously obtained from jsctx_rb_peek() as running.
 *
 * @katom must currently be at the head of the ring buffer.
 */
static inline void
jsctx_rb_pull(struct kbase_context *kctx, struct kbase_jd_atom *katom)
{
	int prio = katom->sched_priority;
	unsigned int js = katom->slot_nr;
	struct jsctx_queue *rb = &kctx->jsctx_queue[prio][js];

	lockdep_assert_held(&kctx->kbdev->hwaccess_lock);

	dev_dbg(kctx->kbdev->dev, "Erasing atom %pK from runnable tree of kctx %pK\n",
		(void *)katom, (void *)kctx);

	/* Atoms must be pulled in the correct order. */
	WARN_ON(katom != jsctx_rb_peek_prio(kctx, js, prio));

	rb_erase(&katom->runnable_tree_node, &rb->runnable_tree);
}

static void
jsctx_tree_add(struct kbase_context *kctx, struct kbase_jd_atom *katom)
{
	struct kbase_device *kbdev = kctx->kbdev;
	int prio = katom->sched_priority;
	unsigned int js = katom->slot_nr;
	struct jsctx_queue *queue = &kctx->jsctx_queue[prio][js];
	struct rb_node **new = &(queue->runnable_tree.rb_node), *parent = NULL;

	lockdep_assert_held(&kctx->kbdev->hwaccess_lock);

	dev_dbg(kbdev->dev, "Adding atom %pK to runnable tree of kctx %pK (s:%u)\n", (void *)katom,
		(void *)kctx, js);

	while (*new) {
		struct kbase_jd_atom *entry = container_of(*new,
				struct kbase_jd_atom, runnable_tree_node);

		parent = *new;
		if (kbase_jd_atom_is_younger(katom, entry))
			new = &((*new)->rb_left);
		else
			new = &((*new)->rb_right);
	}

	/* Add new node and rebalance tree. */
	rb_link_node(&katom->runnable_tree_node, parent, new);
	rb_insert_color(&katom->runnable_tree_node, &queue->runnable_tree);

	KBASE_TLSTREAM_TL_ATTRIB_ATOM_STATE(kbdev, katom, TL_ATOM_STATE_READY);
}

/**
 * jsctx_rb_unpull(): - Undo marking of atom in list as running
 * @kctx: Pointer to kbase context with ring buffer.
 * @katom: Pointer to katom to unpull.
 *
 * Undo jsctx_rb_pull() and put @katom back in the queue.
 *
 * jsctx_rb_unpull() must be called on atoms in the same order the atoms were
 * pulled.
 */
static inline void
jsctx_rb_unpull(struct kbase_context *kctx, struct kbase_jd_atom *katom)
{
	lockdep_assert_held(&kctx->kbdev->hwaccess_lock);

	KBASE_KTRACE_ADD_JM(kctx->kbdev, JS_UNPULL_JOB, kctx, katom, katom->jc,
			    0u);

	jsctx_tree_add(kctx, katom);
}

static bool kbase_js_ctx_pullable(struct kbase_context *kctx, unsigned int js, bool is_scheduled);
static bool kbase_js_ctx_list_add_pullable_nolock(struct kbase_device *kbdev,
						  struct kbase_context *kctx, unsigned int js);
static bool kbase_js_ctx_list_add_unpullable_nolock(struct kbase_device *kbdev,
						    struct kbase_context *kctx, unsigned int js);

typedef bool(katom_ordering_func)(const struct kbase_jd_atom *,
				  const struct kbase_jd_atom *);

bool kbase_js_atom_runs_before(struct kbase_device *kbdev,
			       const struct kbase_jd_atom *katom_a,
			       const struct kbase_jd_atom *katom_b,
			       const kbase_atom_ordering_flag_t order_flags)
{
	struct kbase_context *kctx_a = katom_a->kctx;
	struct kbase_context *kctx_b = katom_b->kctx;
	katom_ordering_func *samectxatomprio_ordering_func =
			kbase_jd_atom_is_younger;

	lockdep_assert_held(&kbdev->hwaccess_lock);

	if (order_flags & KBASE_ATOM_ORDERING_FLAG_SEQNR)
		samectxatomprio_ordering_func = kbase_jd_atom_is_earlier;

	/* It only makes sense to make this test for atoms on the same slot */
	WARN_ON(katom_a->slot_nr != katom_b->slot_nr);

	if (kbdev->js_ctx_scheduling_mode ==
			KBASE_JS_PROCESS_LOCAL_PRIORITY_MODE) {
		/* In local priority mode, querying either way around for "a
		 * should run before b" and "b should run before a" should
		 * always be false when they're from different contexts
		 */
		if (kctx_a != kctx_b)
			return false;
	} else {
		/* In system priority mode, ordering is done first strictly by
		 * context priority, even when katom_b might be lower priority
		 * than katom_a. This is due to scheduling of contexts in order
		 * of highest priority first, regardless of whether the atoms
		 * for a particular slot from such contexts have the highest
		 * priority or not.
		 */
		if (kctx_a != kctx_b) {
			if (kctx_a->priority < kctx_b->priority)
				return true;
			if (kctx_a->priority > kctx_b->priority)
				return false;
		}
	}

	/* For same contexts/contexts with the same context priority (in system
	 * priority mode), ordering is next done by atom priority
	 */
	if (katom_a->sched_priority < katom_b->sched_priority)
		return true;
	if (katom_a->sched_priority > katom_b->sched_priority)
		return false;
	/* For atoms of same priority on the same kctx, they are
	 * ordered by seq_nr/age (dependent on caller)
	 */
	if (kctx_a == kctx_b && samectxatomprio_ordering_func(katom_a, katom_b))
		return true;

	return false;
}
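
/*
 * To summarise kbase_js_atom_runs_before(): ordering is decided, in
 * decreasing precedence, by (1) context priority (system priority mode only;
 * atoms from different contexts never order each other in local priority
 * mode), then (2) atom scheduling priority, then (3) seq_nr or age for
 * equal-priority atoms on the same context, as selected by
 * KBASE_ATOM_ORDERING_FLAG_SEQNR.
 */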

/*
 * Functions private to KBase ('Protected' functions)
 */
int kbasep_js_devdata_init(struct kbase_device * const kbdev)
{
	struct kbasep_js_device_data *jsdd;
	int i, j;

	KBASE_DEBUG_ASSERT(kbdev != NULL);

	jsdd = &kbdev->js_data;

#ifdef CONFIG_MALI_BIFROST_DEBUG
	/* Soft-stop will be disabled on a single context by default unless
	 * softstop_always is set
	 */
	jsdd->softstop_always = false;
#endif /* CONFIG_MALI_BIFROST_DEBUG */
	jsdd->nr_all_contexts_running = 0;
	jsdd->nr_user_contexts_running = 0;
	jsdd->nr_contexts_pullable = 0;
	atomic_set(&jsdd->nr_contexts_runnable, 0);
	/* No ctx allowed to submit */
	jsdd->runpool_irq.submit_allowed = 0u;
	memset(jsdd->runpool_irq.ctx_attr_ref_count, 0,
	       sizeof(jsdd->runpool_irq.ctx_attr_ref_count));
	memset(jsdd->runpool_irq.slot_affinities, 0,
	       sizeof(jsdd->runpool_irq.slot_affinities));
	memset(jsdd->runpool_irq.slot_affinity_refcount, 0,
	       sizeof(jsdd->runpool_irq.slot_affinity_refcount));
	INIT_LIST_HEAD(&jsdd->suspended_soft_jobs_list);

	/* Config attributes */
	jsdd->scheduling_period_ns = DEFAULT_JS_SCHEDULING_PERIOD_NS;
	jsdd->soft_stop_ticks = DEFAULT_JS_SOFT_STOP_TICKS;
	jsdd->soft_stop_ticks_cl = DEFAULT_JS_SOFT_STOP_TICKS_CL;
	jsdd->hard_stop_ticks_ss = DEFAULT_JS_HARD_STOP_TICKS_SS;
	jsdd->hard_stop_ticks_cl = DEFAULT_JS_HARD_STOP_TICKS_CL;
	jsdd->hard_stop_ticks_dumping = DEFAULT_JS_HARD_STOP_TICKS_DUMPING;
	jsdd->gpu_reset_ticks_ss = DEFAULT_JS_RESET_TICKS_SS;
	jsdd->gpu_reset_ticks_cl = DEFAULT_JS_RESET_TICKS_CL;

	jsdd->gpu_reset_ticks_dumping = DEFAULT_JS_RESET_TICKS_DUMPING;
	jsdd->ctx_timeslice_ns = DEFAULT_JS_CTX_TIMESLICE_NS;
	atomic_set(&jsdd->soft_job_timeout_ms, DEFAULT_JS_SOFT_JOB_TIMEOUT);
	jsdd->js_free_wait_time_ms = kbase_get_timeout_ms(kbdev, JM_DEFAULT_JS_FREE_TIMEOUT);

	dev_dbg(kbdev->dev, "JS Config Attribs: ");
	dev_dbg(kbdev->dev, "\tscheduling_period_ns:%u",
		jsdd->scheduling_period_ns);
	dev_dbg(kbdev->dev, "\tsoft_stop_ticks:%u",
		jsdd->soft_stop_ticks);
	dev_dbg(kbdev->dev, "\tsoft_stop_ticks_cl:%u",
		jsdd->soft_stop_ticks_cl);
	dev_dbg(kbdev->dev, "\thard_stop_ticks_ss:%u",
		jsdd->hard_stop_ticks_ss);
	dev_dbg(kbdev->dev, "\thard_stop_ticks_cl:%u",
		jsdd->hard_stop_ticks_cl);
	dev_dbg(kbdev->dev, "\thard_stop_ticks_dumping:%u",
		jsdd->hard_stop_ticks_dumping);
	dev_dbg(kbdev->dev, "\tgpu_reset_ticks_ss:%u",
		jsdd->gpu_reset_ticks_ss);
	dev_dbg(kbdev->dev, "\tgpu_reset_ticks_cl:%u",
		jsdd->gpu_reset_ticks_cl);
	dev_dbg(kbdev->dev, "\tgpu_reset_ticks_dumping:%u",
		jsdd->gpu_reset_ticks_dumping);
	dev_dbg(kbdev->dev, "\tctx_timeslice_ns:%u",
		jsdd->ctx_timeslice_ns);
	dev_dbg(kbdev->dev, "\tsoft_job_timeout:%i",
		atomic_read(&jsdd->soft_job_timeout_ms));
	dev_dbg(kbdev->dev, "\tjs_free_wait_time_ms:%u", jsdd->js_free_wait_time_ms);

	if (!(jsdd->soft_stop_ticks < jsdd->hard_stop_ticks_ss &&
	      jsdd->hard_stop_ticks_ss < jsdd->gpu_reset_ticks_ss &&
	      jsdd->soft_stop_ticks < jsdd->hard_stop_ticks_dumping &&
	      jsdd->hard_stop_ticks_dumping < jsdd->gpu_reset_ticks_dumping)) {
		dev_err(kbdev->dev, "Job scheduler timeouts invalid; soft/hard/reset tick counts should be in increasing order\n");
		return -EINVAL;
	}

#if KBASE_DISABLE_SCHEDULING_SOFT_STOPS
	dev_dbg(kbdev->dev, "Job Scheduling Soft-stops disabled, ignoring value for soft_stop_ticks==%u at %uns per tick. Other soft-stops may still occur.",
		jsdd->soft_stop_ticks,
		jsdd->scheduling_period_ns);
#endif
#if KBASE_DISABLE_SCHEDULING_HARD_STOPS
	dev_dbg(kbdev->dev, "Job Scheduling Hard-stops disabled, ignoring values for hard_stop_ticks_ss==%d and hard_stop_ticks_dumping==%u at %uns per tick. Other hard-stops may still occur.",
		jsdd->hard_stop_ticks_ss,
		jsdd->hard_stop_ticks_dumping,
		jsdd->scheduling_period_ns);
#endif
#if KBASE_DISABLE_SCHEDULING_SOFT_STOPS && KBASE_DISABLE_SCHEDULING_HARD_STOPS
	dev_dbg(kbdev->dev, "Note: The JS tick timer (if coded) will still be run, but do nothing.");
#endif

	for (i = 0; i < kbdev->gpu_props.num_job_slots; ++i)
		jsdd->js_reqs[i] = core_reqs_from_jsn_features(
			kbdev->gpu_props.props.raw_props.js_features[i]);

	/* On error, we could continue on: providing none of the below resources
	 * rely on the ones above
	 */

	mutex_init(&jsdd->runpool_mutex);
	mutex_init(&jsdd->queue_mutex);
	sema_init(&jsdd->schedule_sem, 1);

	for (i = 0; i < kbdev->gpu_props.num_job_slots; ++i) {
		for (j = KBASE_JS_ATOM_SCHED_PRIO_FIRST; j < KBASE_JS_ATOM_SCHED_PRIO_COUNT; ++j) {
			INIT_LIST_HEAD(&jsdd->ctx_list_pullable[i][j]);
			INIT_LIST_HEAD(&jsdd->ctx_list_unpullable[i][j]);
		}
	}

	return 0;
}

void kbasep_js_devdata_halt(struct kbase_device *kbdev)
{
	CSTD_UNUSED(kbdev);
}

void kbasep_js_devdata_term(struct kbase_device *kbdev)
{
	struct kbasep_js_device_data *js_devdata;
	s8 zero_ctx_attr_ref_count[KBASEP_JS_CTX_ATTR_COUNT] = { 0, };
	CSTD_UNUSED(js_devdata);

	KBASE_DEBUG_ASSERT(kbdev != NULL);

	js_devdata = &kbdev->js_data;

	/* The caller must de-register all contexts before calling this
	 */
	KBASE_DEBUG_ASSERT(js_devdata->nr_all_contexts_running == 0);
	KBASE_DEBUG_ASSERT(memcmp(
			js_devdata->runpool_irq.ctx_attr_ref_count,
			zero_ctx_attr_ref_count,
			sizeof(zero_ctx_attr_ref_count)) == 0);
	CSTD_UNUSED(zero_ctx_attr_ref_count);
}

int kbasep_js_kctx_init(struct kbase_context *const kctx)
{
	struct kbasep_js_kctx_info *js_kctx_info;
	int i, j;
	CSTD_UNUSED(js_kctx_info);

	KBASE_DEBUG_ASSERT(kctx != NULL);

	kbase_ctx_sched_init_ctx(kctx);

	for (i = 0; i < BASE_JM_MAX_NR_SLOTS; ++i)
		INIT_LIST_HEAD(&kctx->jctx.sched_info.ctx.ctx_list_entry[i]);

	js_kctx_info = &kctx->jctx.sched_info;

	kctx->slots_pullable = 0;
	js_kctx_info->ctx.nr_jobs = 0;
	kbase_ctx_flag_clear(kctx, KCTX_SCHEDULED);
	kbase_ctx_flag_clear(kctx, KCTX_DYING);
	memset(js_kctx_info->ctx.ctx_attr_ref_count, 0,
	       sizeof(js_kctx_info->ctx.ctx_attr_ref_count));

	/* Initially, the context is disabled from submission until the create
	 * flags are set
	 */
	kbase_ctx_flag_set(kctx, KCTX_SUBMIT_DISABLED);

	/* On error, we could continue on: providing none of the below resources
	 * rely on the ones above
	 */
	mutex_init(&js_kctx_info->ctx.jsctx_mutex);

	init_waitqueue_head(&js_kctx_info->ctx.is_scheduled_wait);

	for (i = KBASE_JS_ATOM_SCHED_PRIO_FIRST; i < KBASE_JS_ATOM_SCHED_PRIO_COUNT; i++) {
		for (j = 0; j < BASE_JM_MAX_NR_SLOTS; j++) {
			INIT_LIST_HEAD(&kctx->jsctx_queue[i][j].x_dep_head);
			kctx->jsctx_queue[i][j].runnable_tree = RB_ROOT;
		}
	}

	return 0;
}

void kbasep_js_kctx_term(struct kbase_context *kctx)
{
	struct kbase_device *kbdev;
	struct kbasep_js_kctx_info *js_kctx_info;
	unsigned int js;
	bool update_ctx_count = false;
	unsigned long flags;
	CSTD_UNUSED(js_kctx_info);

	KBASE_DEBUG_ASSERT(kctx != NULL);

	kbdev = kctx->kbdev;
	KBASE_DEBUG_ASSERT(kbdev != NULL);

	js_kctx_info = &kctx->jctx.sched_info;

	/* The caller must de-register all jobs before calling this */
	KBASE_DEBUG_ASSERT(!kbase_ctx_flag(kctx, KCTX_SCHEDULED));
	KBASE_DEBUG_ASSERT(js_kctx_info->ctx.nr_jobs == 0);

	mutex_lock(&kbdev->js_data.queue_mutex);
	mutex_lock(&kctx->jctx.sched_info.ctx.jsctx_mutex);

	spin_lock_irqsave(&kbdev->hwaccess_lock, flags);
	for (js = 0; js < kbdev->gpu_props.num_job_slots; js++)
		list_del_init(&kctx->jctx.sched_info.ctx.ctx_list_entry[js]);
	spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);

	if (kbase_ctx_flag(kctx, KCTX_RUNNABLE_REF)) {
		WARN_ON(atomic_read(&kbdev->js_data.nr_contexts_runnable) <= 0);
		atomic_dec(&kbdev->js_data.nr_contexts_runnable);
		update_ctx_count = true;
		kbase_ctx_flag_clear(kctx, KCTX_RUNNABLE_REF);
	}

	mutex_unlock(&kctx->jctx.sched_info.ctx.jsctx_mutex);
	mutex_unlock(&kbdev->js_data.queue_mutex);

	if (update_ctx_count) {
		mutex_lock(&kbdev->js_data.runpool_mutex);
		kbase_backend_ctx_count_changed(kbdev);
		mutex_unlock(&kbdev->js_data.runpool_mutex);
	}

	kbase_ctx_sched_remove_ctx(kctx);
}

/*
 * Priority blocking management functions
 */

/* Should not normally use directly - use kbase_jsctx_slot_atom_pulled_dec() instead */
static void kbase_jsctx_slot_prio_blocked_clear(struct kbase_context *kctx, unsigned int js,
						int sched_prio)
{
	struct kbase_jsctx_slot_tracking *slot_tracking =
			&kctx->slot_tracking[js];

	lockdep_assert_held(&kctx->kbdev->hwaccess_lock);

	slot_tracking->blocked &= ~(((kbase_js_prio_bitmap_t)1) << sched_prio);
	KBASE_KTRACE_ADD_JM_SLOT_INFO(kctx->kbdev, JS_SLOT_PRIO_UNBLOCKED, kctx,
				      NULL, 0, js, (unsigned int)sched_prio);
}

static int kbase_jsctx_slot_atoms_pulled(struct kbase_context *kctx, unsigned int js)
{
	return atomic_read(&kctx->slot_tracking[js].atoms_pulled);
}

/*
 * A priority level on a slot is blocked when:
 * - that priority level is blocked
 * - or, any higher priority level is blocked
 */
static bool kbase_jsctx_slot_prio_is_blocked(struct kbase_context *kctx, unsigned int js,
					     int sched_prio)
{
	struct kbase_jsctx_slot_tracking *slot_tracking =
			&kctx->slot_tracking[js];
	kbase_js_prio_bitmap_t prio_bit, higher_prios_mask;

	lockdep_assert_held(&kctx->kbdev->hwaccess_lock);

	/* done in two separate shifts to prevent future undefined behavior
	 * should the number of priority levels == (bit width of the type)
	 */
	prio_bit = (((kbase_js_prio_bitmap_t)1) << sched_prio);
	/* all bits of sched_prio or higher, with sched_prio = 0 being the
	 * highest priority
	 */
	higher_prios_mask = (prio_bit << 1) - 1u;
	return (slot_tracking->blocked & higher_prios_mask) != 0u;
}
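
/*
 * Worked example for the masking above: with sched_prio == 2, prio_bit is
 * 0b100 and higher_prios_mask is (0b100 << 1) - 1 == 0b111, i.e. priority
 * levels 0-2. Level 2 is therefore reported blocked if any of levels 0, 1 or
 * 2 has its blocked bit set.
 */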

/**
 * kbase_jsctx_slot_atom_pulled_inc - Increase counts of atoms that have been
 *                                    pulled for a slot from a ctx, based on
 *                                    this atom
 * @kctx: kbase context
 * @katom: atom pulled
 *
 * Manages counts of atoms pulled (including per-priority-level counts), for
 * later determining when a ctx can become unblocked on a slot.
 *
 * Once a slot has been blocked at @katom's priority level, it should not be
 * pulled from, hence this function should not be called in that case.
 *
 * The return value is to aid tracking of when @kctx becomes runnable.
 *
 * Return: new total count of atoms pulled from all slots on @kctx
 */
static int kbase_jsctx_slot_atom_pulled_inc(struct kbase_context *kctx,
					    const struct kbase_jd_atom *katom)
{
	unsigned int js = katom->slot_nr;
	int sched_prio = katom->sched_priority;
	struct kbase_jsctx_slot_tracking *slot_tracking =
			&kctx->slot_tracking[js];
	int nr_atoms_pulled;

	lockdep_assert_held(&kctx->kbdev->hwaccess_lock);

	WARN(kbase_jsctx_slot_prio_is_blocked(kctx, js, sched_prio),
	     "Should not have pulled atoms for slot %u from a context that is blocked at priority %d or higher",
	     js, sched_prio);

	nr_atoms_pulled = atomic_inc_return(&kctx->atoms_pulled_all_slots);
	atomic_inc(&slot_tracking->atoms_pulled);
	slot_tracking->atoms_pulled_pri[sched_prio]++;

	return nr_atoms_pulled;
}

/**
 * kbase_jsctx_slot_atom_pulled_dec - Decrease counts of atoms that have been
 *                                    pulled for a slot from a ctx, and
 *                                    re-evaluate whether a context is blocked
 *                                    on this slot
 * @kctx: kbase context
 * @katom: atom that has just been removed from a job slot
 *
 * @kctx can become unblocked on a slot for a priority level when it no longer
 * has any pulled atoms at that priority level on that slot, and all higher
 * (numerically lower) priority levels are also unblocked for @kctx on that
 * slot. The latter condition is to retain priority ordering within @kctx.
 *
 * Return: true if the slot was previously blocked but has now become unblocked
 *         at @katom's priority level, false otherwise.
 */
static bool kbase_jsctx_slot_atom_pulled_dec(struct kbase_context *kctx,
					     const struct kbase_jd_atom *katom)
{
	unsigned int js = katom->slot_nr;
	int sched_prio = katom->sched_priority;
	int atoms_pulled_pri;
	struct kbase_jsctx_slot_tracking *slot_tracking =
			&kctx->slot_tracking[js];
	bool slot_prio_became_unblocked = false;

	lockdep_assert_held(&kctx->kbdev->hwaccess_lock);

	atomic_dec(&kctx->atoms_pulled_all_slots);
	atomic_dec(&slot_tracking->atoms_pulled);

	atoms_pulled_pri = --(slot_tracking->atoms_pulled_pri[sched_prio]);

	/* We can safely clear this priority level's blocked status even if
	 * higher priority levels are still blocked: a subsequent query to
	 * kbase_jsctx_slot_prio_is_blocked() will still return true
	 */
	if (!atoms_pulled_pri &&
	    kbase_jsctx_slot_prio_is_blocked(kctx, js, sched_prio)) {
		kbase_jsctx_slot_prio_blocked_clear(kctx, js, sched_prio);

		if (!kbase_jsctx_slot_prio_is_blocked(kctx, js, sched_prio))
			slot_prio_became_unblocked = true;
	}

	if (slot_prio_became_unblocked)
		KBASE_KTRACE_ADD_JM_SLOT_INFO(kctx->kbdev,
					      JS_SLOT_PRIO_AND_HIGHER_UNBLOCKED,
					      kctx, katom, katom->jc, js,
					      (unsigned int)sched_prio);

	return slot_prio_became_unblocked;
}
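
/*
 * Example of the unblocking rule above: if levels 0 and 1 are both blocked on
 * a slot and the last pulled level-1 atom is removed, level 1's blocked bit
 * is cleared, but the function still returns false because
 * kbase_jsctx_slot_prio_is_blocked() continues to report level 1 as blocked
 * while level 0 remains blocked.
 */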

/**
 * kbase_js_ctx_list_add_pullable_nolock - Variant of
 *                                         kbase_js_ctx_list_add_pullable()
 *                                         where the caller must hold
 *                                         hwaccess_lock
 * @kbdev: Device pointer
 * @kctx: Context to add to queue
 * @js: Job slot to use
 *
 * Caller must hold hwaccess_lock
 *
 * Return: true if caller should call kbase_backend_ctx_count_changed()
 */
static bool kbase_js_ctx_list_add_pullable_nolock(struct kbase_device *kbdev,
						  struct kbase_context *kctx, unsigned int js)
{
	bool ret = false;

	lockdep_assert_held(&kbdev->hwaccess_lock);
	dev_dbg(kbdev->dev, "Add pullable tail kctx %pK (s:%u)\n", (void *)kctx, js);

	if (!list_empty(&kctx->jctx.sched_info.ctx.ctx_list_entry[js]))
		list_del_init(&kctx->jctx.sched_info.ctx.ctx_list_entry[js]);

	list_add_tail(&kctx->jctx.sched_info.ctx.ctx_list_entry[js],
		      &kbdev->js_data.ctx_list_pullable[js][kctx->priority]);

	if (!kctx->slots_pullable) {
		kbdev->js_data.nr_contexts_pullable++;
		ret = true;
		if (!kbase_jsctx_atoms_pulled(kctx)) {
			WARN_ON(kbase_ctx_flag(kctx, KCTX_RUNNABLE_REF));
			kbase_ctx_flag_set(kctx, KCTX_RUNNABLE_REF);
			atomic_inc(&kbdev->js_data.nr_contexts_runnable);
		}
	}
	kctx->slots_pullable |= (1 << js);

	return ret;
}

/**
 * kbase_js_ctx_list_add_pullable_head_nolock - Variant of
 *                                              kbase_js_ctx_list_add_pullable_head()
 *                                              where the caller must hold
 *                                              hwaccess_lock
 * @kbdev: Device pointer
 * @kctx: Context to add to queue
 * @js: Job slot to use
 *
 * Caller must hold hwaccess_lock
 *
 * Return: true if caller should call kbase_backend_ctx_count_changed()
 */
static bool kbase_js_ctx_list_add_pullable_head_nolock(struct kbase_device *kbdev,
						       struct kbase_context *kctx, unsigned int js)
{
	bool ret = false;

	lockdep_assert_held(&kbdev->hwaccess_lock);
	dev_dbg(kbdev->dev, "Add pullable head kctx %pK (s:%u)\n", (void *)kctx, js);

	if (!list_empty(&kctx->jctx.sched_info.ctx.ctx_list_entry[js]))
		list_del_init(&kctx->jctx.sched_info.ctx.ctx_list_entry[js]);

	list_add(&kctx->jctx.sched_info.ctx.ctx_list_entry[js],
		 &kbdev->js_data.ctx_list_pullable[js][kctx->priority]);

	if (!kctx->slots_pullable) {
		kbdev->js_data.nr_contexts_pullable++;
		ret = true;
		if (!kbase_jsctx_atoms_pulled(kctx)) {
			WARN_ON(kbase_ctx_flag(kctx, KCTX_RUNNABLE_REF));
			kbase_ctx_flag_set(kctx, KCTX_RUNNABLE_REF);
			atomic_inc(&kbdev->js_data.nr_contexts_runnable);
		}
	}
	kctx->slots_pullable |= (1 << js);

	return ret;
}

/**
 * kbase_js_ctx_list_add_pullable_head - Add context to the head of the
 *                                       per-slot pullable context queue
 * @kbdev: Device pointer
 * @kctx: Context to add to queue
 * @js: Job slot to use
 *
 * If the context is on either the pullable or unpullable queues, then it is
 * removed before being added to the head.
 *
 * This function should be used when a context has been scheduled, but no jobs
 * can currently be pulled from it.
 *
 * Return: true if caller should call kbase_backend_ctx_count_changed()
 */
static bool kbase_js_ctx_list_add_pullable_head(struct kbase_device *kbdev,
						struct kbase_context *kctx, unsigned int js)
{
	bool ret;
	unsigned long flags;

	spin_lock_irqsave(&kbdev->hwaccess_lock, flags);
	ret = kbase_js_ctx_list_add_pullable_head_nolock(kbdev, kctx, js);
	spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);

	return ret;
}

/**
 * kbase_js_ctx_list_add_unpullable_nolock - Add context to the tail of the
 *                                           per-slot unpullable context queue
 * @kbdev: Device pointer
 * @kctx: Context to add to queue
 * @js: Job slot to use
 *
 * The context must already be on the per-slot pullable queue. It will be
 * removed from the pullable queue before being added to the unpullable queue.
 *
 * This function should be used when a context has been pulled from, and there
 * are no jobs remaining on the specified slot.
 *
 * Caller must hold hwaccess_lock
 *
 * Return: true if caller should call kbase_backend_ctx_count_changed()
 */
static bool kbase_js_ctx_list_add_unpullable_nolock(struct kbase_device *kbdev,
						    struct kbase_context *kctx, unsigned int js)
{
	bool ret = false;

	lockdep_assert_held(&kbdev->hwaccess_lock);
	dev_dbg(kbdev->dev, "Add unpullable tail kctx %pK (s:%u)\n", (void *)kctx, js);

	list_move_tail(&kctx->jctx.sched_info.ctx.ctx_list_entry[js],
		       &kbdev->js_data.ctx_list_unpullable[js][kctx->priority]);

	if (kctx->slots_pullable == (1 << js)) {
		kbdev->js_data.nr_contexts_pullable--;
		ret = true;
		if (!kbase_jsctx_atoms_pulled(kctx)) {
			WARN_ON(!kbase_ctx_flag(kctx, KCTX_RUNNABLE_REF));
			kbase_ctx_flag_clear(kctx, KCTX_RUNNABLE_REF);
			atomic_dec(&kbdev->js_data.nr_contexts_runnable);
		}
	}
	kctx->slots_pullable &= ~(1 << js);

	return ret;
}

/**
 * kbase_js_ctx_list_remove_nolock - Remove context from the per-slot pullable
 *                                   or unpullable context queues
 * @kbdev: Device pointer
 * @kctx: Context to remove from queue
 * @js: Job slot to use
 *
 * The context must already be on one of the queues.
 *
 * This function should be used when a context has no jobs on the GPU, and no
 * jobs remaining for the specified slot.
 *
 * Caller must hold hwaccess_lock
 *
 * Return: true if caller should call kbase_backend_ctx_count_changed()
 */
static bool kbase_js_ctx_list_remove_nolock(struct kbase_device *kbdev, struct kbase_context *kctx,
					    unsigned int js)
{
	bool ret = false;

	lockdep_assert_held(&kbdev->hwaccess_lock);

	WARN_ON(list_empty(&kctx->jctx.sched_info.ctx.ctx_list_entry[js]));

	list_del_init(&kctx->jctx.sched_info.ctx.ctx_list_entry[js]);

	if (kctx->slots_pullable == (1 << js)) {
		kbdev->js_data.nr_contexts_pullable--;
		ret = true;
		if (!kbase_jsctx_atoms_pulled(kctx)) {
			WARN_ON(!kbase_ctx_flag(kctx, KCTX_RUNNABLE_REF));
			kbase_ctx_flag_clear(kctx, KCTX_RUNNABLE_REF);
			atomic_dec(&kbdev->js_data.nr_contexts_runnable);
		}
	}
	kctx->slots_pullable &= ~(1 << js);

	return ret;
}
1057*4882a593Smuzhiyun
1058*4882a593Smuzhiyun /**
1059*4882a593Smuzhiyun * kbase_js_ctx_list_pop_head_nolock - Variant of kbase_js_ctx_list_pop_head()
1060*4882a593Smuzhiyun * where the caller must hold
1061*4882a593Smuzhiyun * hwaccess_lock
1062*4882a593Smuzhiyun * @kbdev: Device pointer
1063*4882a593Smuzhiyun * @js: Job slot to use
1064*4882a593Smuzhiyun *
1065*4882a593Smuzhiyun * Caller must hold hwaccess_lock
1066*4882a593Smuzhiyun *
1067*4882a593Smuzhiyun * Return: Context to use for specified slot.
1068*4882a593Smuzhiyun * NULL if no contexts present for specified slot
1069*4882a593Smuzhiyun */
1070*4882a593Smuzhiyun static struct kbase_context *kbase_js_ctx_list_pop_head_nolock(struct kbase_device *kbdev,
1071*4882a593Smuzhiyun unsigned int js)
1072*4882a593Smuzhiyun {
1073*4882a593Smuzhiyun struct kbase_context *kctx;
1074*4882a593Smuzhiyun int i;
1075*4882a593Smuzhiyun
1076*4882a593Smuzhiyun lockdep_assert_held(&kbdev->hwaccess_lock);
1077*4882a593Smuzhiyun
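/* Scan the pullable queues from highest to lowest priority; the first
 * non-empty queue supplies the context, so higher-priority contexts
 * are always popped first.
 */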
1078*4882a593Smuzhiyun for (i = KBASE_JS_ATOM_SCHED_PRIO_FIRST; i < KBASE_JS_ATOM_SCHED_PRIO_COUNT; i++) {
1079*4882a593Smuzhiyun if (list_empty(&kbdev->js_data.ctx_list_pullable[js][i]))
1080*4882a593Smuzhiyun continue;
1081*4882a593Smuzhiyun
1082*4882a593Smuzhiyun kctx = list_entry(kbdev->js_data.ctx_list_pullable[js][i].next,
1083*4882a593Smuzhiyun struct kbase_context,
1084*4882a593Smuzhiyun jctx.sched_info.ctx.ctx_list_entry[js]);
1085*4882a593Smuzhiyun
1086*4882a593Smuzhiyun list_del_init(&kctx->jctx.sched_info.ctx.ctx_list_entry[js]);
1087*4882a593Smuzhiyun dev_dbg(kbdev->dev, "Popped %pK from the pullable queue (s:%u)\n", (void *)kctx,
1088*4882a593Smuzhiyun js);
1089*4882a593Smuzhiyun return kctx;
1090*4882a593Smuzhiyun }
1091*4882a593Smuzhiyun return NULL;
1092*4882a593Smuzhiyun }
1093*4882a593Smuzhiyun
1094*4882a593Smuzhiyun /**
1095*4882a593Smuzhiyun * kbase_js_ctx_list_pop_head - Pop the head context off the per-slot pullable
1096*4882a593Smuzhiyun * queue.
1097*4882a593Smuzhiyun * @kbdev: Device pointer
1098*4882a593Smuzhiyun * @js: Job slot to use
1099*4882a593Smuzhiyun *
1100*4882a593Smuzhiyun * Return: Context to use for specified slot.
1101*4882a593Smuzhiyun * NULL if no contexts present for specified slot
1102*4882a593Smuzhiyun */
1103*4882a593Smuzhiyun static struct kbase_context *kbase_js_ctx_list_pop_head(struct kbase_device *kbdev, unsigned int js)
1104*4882a593Smuzhiyun {
1105*4882a593Smuzhiyun struct kbase_context *kctx;
1106*4882a593Smuzhiyun unsigned long flags;
1107*4882a593Smuzhiyun
1108*4882a593Smuzhiyun spin_lock_irqsave(&kbdev->hwaccess_lock, flags);
1109*4882a593Smuzhiyun kctx = kbase_js_ctx_list_pop_head_nolock(kbdev, js);
1110*4882a593Smuzhiyun spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
1111*4882a593Smuzhiyun
1112*4882a593Smuzhiyun return kctx;
1113*4882a593Smuzhiyun }
1114*4882a593Smuzhiyun
1115*4882a593Smuzhiyun /**
1116*4882a593Smuzhiyun * kbase_js_ctx_pullable - Return if a context can be pulled from on the
1117*4882a593Smuzhiyun * specified slot
1118*4882a593Smuzhiyun * @kctx: Context pointer
1119*4882a593Smuzhiyun * @js: Job slot to use
1120*4882a593Smuzhiyun * @is_scheduled: true if the context is currently scheduled
1121*4882a593Smuzhiyun *
1122*4882a593Smuzhiyun * Caller must hold hwaccess_lock
1123*4882a593Smuzhiyun *
1124*4882a593Smuzhiyun * Return: true if context can be pulled from on specified slot
1125*4882a593Smuzhiyun * false otherwise
1126*4882a593Smuzhiyun */
1127*4882a593Smuzhiyun static bool kbase_js_ctx_pullable(struct kbase_context *kctx, unsigned int js, bool is_scheduled)
1128*4882a593Smuzhiyun {
1129*4882a593Smuzhiyun struct kbasep_js_device_data *js_devdata;
1130*4882a593Smuzhiyun struct kbase_jd_atom *katom;
1131*4882a593Smuzhiyun struct kbase_device *kbdev = kctx->kbdev;
1132*4882a593Smuzhiyun
1133*4882a593Smuzhiyun lockdep_assert_held(&kbdev->hwaccess_lock);
1134*4882a593Smuzhiyun
1135*4882a593Smuzhiyun js_devdata = &kbdev->js_data;
1136*4882a593Smuzhiyun
1137*4882a593Smuzhiyun if (is_scheduled) {
1138*4882a593Smuzhiyun if (!kbasep_js_is_submit_allowed(js_devdata, kctx)) {
1139*4882a593Smuzhiyun dev_dbg(kbdev->dev, "JS: No submit allowed for kctx %pK\n",
1140*4882a593Smuzhiyun (void *)kctx);
1141*4882a593Smuzhiyun return false;
1142*4882a593Smuzhiyun }
1143*4882a593Smuzhiyun }
1144*4882a593Smuzhiyun katom = jsctx_rb_peek(kctx, js);
1145*4882a593Smuzhiyun if (!katom) {
1146*4882a593Smuzhiyun dev_dbg(kbdev->dev, "JS: No pullable atom in kctx %pK (s:%u)\n", (void *)kctx, js);
1147*4882a593Smuzhiyun return false; /* No pullable atoms */
1148*4882a593Smuzhiyun }
1149*4882a593Smuzhiyun if (kbase_jsctx_slot_prio_is_blocked(kctx, js, katom->sched_priority)) {
1150*4882a593Smuzhiyun KBASE_KTRACE_ADD_JM_SLOT_INFO(
1151*4882a593Smuzhiyun kctx->kbdev, JS_SLOT_PRIO_IS_BLOCKED, kctx, katom,
1152*4882a593Smuzhiyun katom->jc, js, (unsigned int)katom->sched_priority);
1153*4882a593Smuzhiyun dev_dbg(kbdev->dev,
1154*4882a593Smuzhiyun "JS: kctx %pK is blocked from submitting atoms at priority %d and lower (s:%u)\n",
1155*4882a593Smuzhiyun (void *)kctx, katom->sched_priority, js);
1156*4882a593Smuzhiyun return false;
1157*4882a593Smuzhiyun }
1158*4882a593Smuzhiyun if (atomic_read(&katom->blocked)) {
1159*4882a593Smuzhiyun dev_dbg(kbdev->dev, "JS: Atom %pK is blocked in js_ctx_pullable\n",
1160*4882a593Smuzhiyun (void *)katom);
1161*4882a593Smuzhiyun return false; /* next atom blocked */
1162*4882a593Smuzhiyun }
1163*4882a593Smuzhiyun if (kbase_js_atom_blocked_on_x_dep(katom)) {
1164*4882a593Smuzhiyun if (katom->x_pre_dep->gpu_rb_state ==
1165*4882a593Smuzhiyun KBASE_ATOM_GPU_RB_NOT_IN_SLOT_RB ||
1166*4882a593Smuzhiyun katom->x_pre_dep->will_fail_event_code) {
1167*4882a593Smuzhiyun dev_dbg(kbdev->dev,
1168*4882a593Smuzhiyun "JS: X pre-dep %pK is not present in slot FIFO or will fail\n",
1169*4882a593Smuzhiyun (void *)katom->x_pre_dep);
1170*4882a593Smuzhiyun return false;
1171*4882a593Smuzhiyun }
1172*4882a593Smuzhiyun if ((katom->atom_flags & KBASE_KATOM_FLAG_FAIL_BLOCKER) &&
1173*4882a593Smuzhiyun kbase_backend_nr_atoms_on_slot(kctx->kbdev, js)) {
1174*4882a593Smuzhiyun dev_dbg(kbdev->dev,
1175*4882a593Smuzhiyun "JS: Atom %pK has cross-slot fail dependency and atoms on slot (s:%u)\n",
1176*4882a593Smuzhiyun (void *)katom, js);
1177*4882a593Smuzhiyun return false;
1178*4882a593Smuzhiyun }
1179*4882a593Smuzhiyun }
1180*4882a593Smuzhiyun
1181*4882a593Smuzhiyun dev_dbg(kbdev->dev, "JS: Atom %pK is pullable in kctx %pK (s:%u)\n", (void *)katom,
1182*4882a593Smuzhiyun (void *)kctx, js);
1183*4882a593Smuzhiyun
1184*4882a593Smuzhiyun return true;
1185*4882a593Smuzhiyun }
1186*4882a593Smuzhiyun
1187*4882a593Smuzhiyun static bool kbase_js_dep_validate(struct kbase_context *kctx,
1188*4882a593Smuzhiyun struct kbase_jd_atom *katom)
1189*4882a593Smuzhiyun {
1190*4882a593Smuzhiyun struct kbase_device *kbdev = kctx->kbdev;
1191*4882a593Smuzhiyun bool ret = true;
1192*4882a593Smuzhiyun bool has_dep = false, has_x_dep = false;
1193*4882a593Smuzhiyun unsigned int js = kbase_js_get_slot(kbdev, katom);
1194*4882a593Smuzhiyun int prio = katom->sched_priority;
1195*4882a593Smuzhiyun int i;
1196*4882a593Smuzhiyun
1197*4882a593Smuzhiyun for (i = 0; i < 2; i++) {
1198*4882a593Smuzhiyun struct kbase_jd_atom *dep_atom = katom->dep[i].atom;
1199*4882a593Smuzhiyun
1200*4882a593Smuzhiyun if (dep_atom) {
1201*4882a593Smuzhiyun unsigned int dep_js = kbase_js_get_slot(kbdev, dep_atom);
1202*4882a593Smuzhiyun int dep_prio = dep_atom->sched_priority;
1203*4882a593Smuzhiyun
1204*4882a593Smuzhiyun dev_dbg(kbdev->dev,
1205*4882a593Smuzhiyun "Checking dep %d of atom %pK (s:%d) on %pK (s:%d)\n",
1206*4882a593Smuzhiyun i, (void *)katom, js, (void *)dep_atom, dep_js);
1207*4882a593Smuzhiyun
1208*4882a593Smuzhiyun /* Dependent atom must already have been submitted */
1209*4882a593Smuzhiyun if (!(dep_atom->atom_flags &
1210*4882a593Smuzhiyun KBASE_KATOM_FLAG_JSCTX_IN_TREE)) {
1211*4882a593Smuzhiyun dev_dbg(kbdev->dev,
1212*4882a593Smuzhiyun "Blocker not submitted yet\n");
1213*4882a593Smuzhiyun ret = false;
1214*4882a593Smuzhiyun break;
1215*4882a593Smuzhiyun }
1216*4882a593Smuzhiyun
1217*4882a593Smuzhiyun /* Dependencies with different priorities can't
1218*4882a593Smuzhiyun * be represented in the ringbuffer
1219*4882a593Smuzhiyun */
1220*4882a593Smuzhiyun if (prio != dep_prio) {
1221*4882a593Smuzhiyun dev_dbg(kbdev->dev,
1222*4882a593Smuzhiyun "Different atom priorities\n");
1223*4882a593Smuzhiyun ret = false;
1224*4882a593Smuzhiyun break;
1225*4882a593Smuzhiyun }
1226*4882a593Smuzhiyun
1227*4882a593Smuzhiyun if (js == dep_js) {
1228*4882a593Smuzhiyun /* Only one same-slot dependency can be
1229*4882a593Smuzhiyun * represented in the ringbuffer
1230*4882a593Smuzhiyun */
1231*4882a593Smuzhiyun if (has_dep) {
1232*4882a593Smuzhiyun dev_dbg(kbdev->dev,
1233*4882a593Smuzhiyun "Too many same-slot deps\n");
1234*4882a593Smuzhiyun ret = false;
1235*4882a593Smuzhiyun break;
1236*4882a593Smuzhiyun }
1237*4882a593Smuzhiyun /* Each dependee atom can only have one
1238*4882a593Smuzhiyun * same-slot dependency
1239*4882a593Smuzhiyun */
1240*4882a593Smuzhiyun if (dep_atom->post_dep) {
1241*4882a593Smuzhiyun dev_dbg(kbdev->dev,
1242*4882a593Smuzhiyun "Too many same-slot successors\n");
1243*4882a593Smuzhiyun ret = false;
1244*4882a593Smuzhiyun break;
1245*4882a593Smuzhiyun }
1246*4882a593Smuzhiyun has_dep = true;
1247*4882a593Smuzhiyun } else {
1248*4882a593Smuzhiyun /* Only one cross-slot dependency can be
1249*4882a593Smuzhiyun * represented in the ringbuffer
1250*4882a593Smuzhiyun */
1251*4882a593Smuzhiyun if (has_x_dep) {
1252*4882a593Smuzhiyun dev_dbg(kbdev->dev,
1253*4882a593Smuzhiyun "Too many cross-slot deps\n");
1254*4882a593Smuzhiyun ret = false;
1255*4882a593Smuzhiyun break;
1256*4882a593Smuzhiyun }
1257*4882a593Smuzhiyun /* Each dependee atom can only have one
1258*4882a593Smuzhiyun * cross-slot dependency
1259*4882a593Smuzhiyun */
1260*4882a593Smuzhiyun if (dep_atom->x_post_dep) {
1261*4882a593Smuzhiyun dev_dbg(kbdev->dev,
1262*4882a593Smuzhiyun "Too many cross-slot successors\n");
1263*4882a593Smuzhiyun ret = false;
1264*4882a593Smuzhiyun break;
1265*4882a593Smuzhiyun }
1266*4882a593Smuzhiyun /* The dependee atom can not already be in the
1267*4882a593Smuzhiyun * HW access ringbuffer
1268*4882a593Smuzhiyun */
1269*4882a593Smuzhiyun if (dep_atom->gpu_rb_state !=
1270*4882a593Smuzhiyun KBASE_ATOM_GPU_RB_NOT_IN_SLOT_RB) {
1271*4882a593Smuzhiyun dev_dbg(kbdev->dev,
1272*4882a593Smuzhiyun "Blocker already in ringbuffer (state:%d)\n",
1273*4882a593Smuzhiyun dep_atom->gpu_rb_state);
1274*4882a593Smuzhiyun ret = false;
1275*4882a593Smuzhiyun break;
1276*4882a593Smuzhiyun }
1277*4882a593Smuzhiyun /* The dependee atom can not already have
1278*4882a593Smuzhiyun * completed
1279*4882a593Smuzhiyun */
1280*4882a593Smuzhiyun if (dep_atom->status !=
1281*4882a593Smuzhiyun KBASE_JD_ATOM_STATE_IN_JS) {
1282*4882a593Smuzhiyun dev_dbg(kbdev->dev,
1283*4882a593Smuzhiyun "Blocker already completed (status:%d)\n",
1284*4882a593Smuzhiyun dep_atom->status);
1285*4882a593Smuzhiyun ret = false;
1286*4882a593Smuzhiyun break;
1287*4882a593Smuzhiyun }
1288*4882a593Smuzhiyun
1289*4882a593Smuzhiyun has_x_dep = true;
1290*4882a593Smuzhiyun }
1291*4882a593Smuzhiyun
1292*4882a593Smuzhiyun /* Dependency can be represented in ringbuffers */
1293*4882a593Smuzhiyun }
1294*4882a593Smuzhiyun }
1295*4882a593Smuzhiyun
1296*4882a593Smuzhiyun /* If the dependencies can be represented in the ringbuffers then clear
1297*4882a593Smuzhiyun * them from the atom structure
1298*4882a593Smuzhiyun */
1299*4882a593Smuzhiyun if (ret) {
1300*4882a593Smuzhiyun for (i = 0; i < 2; i++) {
1301*4882a593Smuzhiyun struct kbase_jd_atom *dep_atom = katom->dep[i].atom;
1302*4882a593Smuzhiyun
1303*4882a593Smuzhiyun if (dep_atom) {
1304*4882a593Smuzhiyun int dep_js = kbase_js_get_slot(kbdev, dep_atom);
1305*4882a593Smuzhiyun
1306*4882a593Smuzhiyun dev_dbg(kbdev->dev,
1307*4882a593Smuzhiyun "Clearing dep %d of atom %pK (s:%d) on %pK (s:%d)\n",
1308*4882a593Smuzhiyun i, (void *)katom, js, (void *)dep_atom,
1309*4882a593Smuzhiyun dep_js);
1310*4882a593Smuzhiyun
1311*4882a593Smuzhiyun if ((js != dep_js) &&
1312*4882a593Smuzhiyun (dep_atom->status !=
1313*4882a593Smuzhiyun KBASE_JD_ATOM_STATE_COMPLETED)
1314*4882a593Smuzhiyun && (dep_atom->status !=
1315*4882a593Smuzhiyun KBASE_JD_ATOM_STATE_HW_COMPLETED)
1316*4882a593Smuzhiyun && (dep_atom->status !=
1317*4882a593Smuzhiyun KBASE_JD_ATOM_STATE_UNUSED)) {
1318*4882a593Smuzhiyun
1319*4882a593Smuzhiyun katom->atom_flags |=
1320*4882a593Smuzhiyun KBASE_KATOM_FLAG_X_DEP_BLOCKED;
1321*4882a593Smuzhiyun
1322*4882a593Smuzhiyun dev_dbg(kbdev->dev, "Set X_DEP flag on atom %pK\n",
1323*4882a593Smuzhiyun (void *)katom);
1324*4882a593Smuzhiyun
1325*4882a593Smuzhiyun katom->x_pre_dep = dep_atom;
1326*4882a593Smuzhiyun dep_atom->x_post_dep = katom;
1327*4882a593Smuzhiyun if (kbase_jd_katom_dep_type(
1328*4882a593Smuzhiyun &katom->dep[i]) ==
1329*4882a593Smuzhiyun BASE_JD_DEP_TYPE_DATA)
1330*4882a593Smuzhiyun katom->atom_flags |=
1331*4882a593Smuzhiyun KBASE_KATOM_FLAG_FAIL_BLOCKER;
1332*4882a593Smuzhiyun }
1333*4882a593Smuzhiyun if ((kbase_jd_katom_dep_type(&katom->dep[i])
1334*4882a593Smuzhiyun == BASE_JD_DEP_TYPE_DATA) &&
1335*4882a593Smuzhiyun (js == dep_js)) {
1336*4882a593Smuzhiyun katom->pre_dep = dep_atom;
1337*4882a593Smuzhiyun dep_atom->post_dep = katom;
1338*4882a593Smuzhiyun }
1339*4882a593Smuzhiyun
1340*4882a593Smuzhiyun list_del(&katom->dep_item[i]);
1341*4882a593Smuzhiyun kbase_jd_katom_dep_clear(&katom->dep[i]);
1342*4882a593Smuzhiyun }
1343*4882a593Smuzhiyun }
1344*4882a593Smuzhiyun } else {
1345*4882a593Smuzhiyun dev_dbg(kbdev->dev,
1346*4882a593Smuzhiyun "Deps of atom %pK (s:%d) could not be represented\n",
1347*4882a593Smuzhiyun (void *)katom, js);
1348*4882a593Smuzhiyun }
1349*4882a593Smuzhiyun
1350*4882a593Smuzhiyun return ret;
1351*4882a593Smuzhiyun }
1352*4882a593Smuzhiyun
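/**
 * kbase_js_set_ctx_priority - Set the context priority and requeue it
 * @kctx: Context pointer
 * @new_priority: New priority to set the context to
 *
 * Moves the context onto the pullable/unpullable lists that match the new
 * priority, then records the priority on the context.
 *
 * Caller must hold hwaccess_lock
 */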
1353*4882a593Smuzhiyun void kbase_js_set_ctx_priority(struct kbase_context *kctx, int new_priority)
1354*4882a593Smuzhiyun {
1355*4882a593Smuzhiyun struct kbase_device *kbdev = kctx->kbdev;
1356*4882a593Smuzhiyun unsigned int js;
1357*4882a593Smuzhiyun
1358*4882a593Smuzhiyun lockdep_assert_held(&kbdev->hwaccess_lock);
1359*4882a593Smuzhiyun
1360*4882a593Smuzhiyun /* Move kctx to the pullable/unpullable list as per the new priority */
1361*4882a593Smuzhiyun if (new_priority != kctx->priority) {
1362*4882a593Smuzhiyun for (js = 0; js < kbdev->gpu_props.num_job_slots; js++) {
1363*4882a593Smuzhiyun if (kctx->slots_pullable & (1 << js))
1364*4882a593Smuzhiyun list_move_tail(&kctx->jctx.sched_info.ctx.ctx_list_entry[js],
1365*4882a593Smuzhiyun &kbdev->js_data.ctx_list_pullable[js][new_priority]);
1366*4882a593Smuzhiyun else
1367*4882a593Smuzhiyun list_move_tail(&kctx->jctx.sched_info.ctx.ctx_list_entry[js],
1368*4882a593Smuzhiyun &kbdev->js_data.ctx_list_unpullable[js][new_priority]);
1369*4882a593Smuzhiyun }
1370*4882a593Smuzhiyun
1371*4882a593Smuzhiyun kctx->priority = new_priority;
1372*4882a593Smuzhiyun }
1373*4882a593Smuzhiyun }
1374*4882a593Smuzhiyun
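/**
 * kbase_js_update_ctx_priority - Re-derive the context priority from its atoms
 * @kctx: Context pointer
 *
 * In KBASE_JS_SYSTEM_PRIORITY_MODE the context inherits the priority of its
 * highest-priority in-use atom; in other scheduling modes every context is
 * given the default low priority.
 *
 * Caller must hold hwaccess_lock
 */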
1375*4882a593Smuzhiyun void kbase_js_update_ctx_priority(struct kbase_context *kctx)
1376*4882a593Smuzhiyun {
1377*4882a593Smuzhiyun struct kbase_device *kbdev = kctx->kbdev;
1378*4882a593Smuzhiyun int new_priority = KBASE_JS_ATOM_SCHED_PRIO_LOW;
1379*4882a593Smuzhiyun int prio;
1380*4882a593Smuzhiyun
1381*4882a593Smuzhiyun lockdep_assert_held(&kbdev->hwaccess_lock);
1382*4882a593Smuzhiyun
1383*4882a593Smuzhiyun if (kbdev->js_ctx_scheduling_mode == KBASE_JS_SYSTEM_PRIORITY_MODE) {
1384*4882a593Smuzhiyun /* Determine the new priority for context, as per the priority
1385*4882a593Smuzhiyun * of currently in-use atoms.
1386*4882a593Smuzhiyun */
1387*4882a593Smuzhiyun for (prio = KBASE_JS_ATOM_SCHED_PRIO_FIRST;
1388*4882a593Smuzhiyun prio < KBASE_JS_ATOM_SCHED_PRIO_COUNT; prio++) {
1389*4882a593Smuzhiyun if (kctx->atoms_count[prio]) {
1390*4882a593Smuzhiyun new_priority = prio;
1391*4882a593Smuzhiyun break;
1392*4882a593Smuzhiyun }
1393*4882a593Smuzhiyun }
1394*4882a593Smuzhiyun }
1395*4882a593Smuzhiyun
1396*4882a593Smuzhiyun kbase_js_set_ctx_priority(kctx, new_priority);
1397*4882a593Smuzhiyun }
1398*4882a593Smuzhiyun KBASE_EXPORT_TEST_API(kbase_js_update_ctx_priority);
1399*4882a593Smuzhiyun
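/* Renderpass bookkeeping: a renderpass is bracketed by a start atom
 * (BASE_JD_REQ_START_RENDERPASS) and an end atom (BASE_JD_REQ_END_RENDERPASS)
 * that share a renderpass_id. The helpers below take a renderpass out of the
 * KBASE_JD_RP_COMPLETE state when its start atom is added, and record the
 * end atom that the retry/out-of-memory states (KBASE_JD_RP_RETRY*) depend
 * on later.
 */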
1400*4882a593Smuzhiyun /**
1401*4882a593Smuzhiyun * js_add_start_rp() - Add an atom that starts a renderpass to the job scheduler
1402*4882a593Smuzhiyun * @start_katom: Pointer to the atom to be added.
1403*4882a593Smuzhiyun * Return: 0 if successful or a negative value on failure.
1404*4882a593Smuzhiyun */
1405*4882a593Smuzhiyun static int js_add_start_rp(struct kbase_jd_atom *const start_katom)
1406*4882a593Smuzhiyun {
1407*4882a593Smuzhiyun struct kbase_context *const kctx = start_katom->kctx;
1408*4882a593Smuzhiyun struct kbase_jd_renderpass *rp;
1409*4882a593Smuzhiyun struct kbase_device *const kbdev = kctx->kbdev;
1410*4882a593Smuzhiyun unsigned long flags;
1411*4882a593Smuzhiyun
1412*4882a593Smuzhiyun lockdep_assert_held(&kctx->jctx.lock);
1413*4882a593Smuzhiyun
1414*4882a593Smuzhiyun if (WARN_ON(!(start_katom->core_req & BASE_JD_REQ_START_RENDERPASS)))
1415*4882a593Smuzhiyun return -EINVAL;
1416*4882a593Smuzhiyun
1417*4882a593Smuzhiyun if (start_katom->core_req & BASE_JD_REQ_END_RENDERPASS)
1418*4882a593Smuzhiyun return -EINVAL;
1419*4882a593Smuzhiyun
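/* renderpass_id is a small fixed-width field, so this build-time assertion
 * guarantees that every representable value indexes safely into the
 * renderpasses array dereferenced below.
 */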
1420*4882a593Smuzhiyun compiletime_assert((1ull << (sizeof(start_katom->renderpass_id) * 8)) <=
1421*4882a593Smuzhiyun ARRAY_SIZE(kctx->jctx.renderpasses),
1422*4882a593Smuzhiyun "Should check invalid access to renderpasses");
1423*4882a593Smuzhiyun
1424*4882a593Smuzhiyun rp = &kctx->jctx.renderpasses[start_katom->renderpass_id];
1425*4882a593Smuzhiyun
1426*4882a593Smuzhiyun if (rp->state != KBASE_JD_RP_COMPLETE)
1427*4882a593Smuzhiyun return -EINVAL;
1428*4882a593Smuzhiyun
1429*4882a593Smuzhiyun dev_dbg(kctx->kbdev->dev, "JS add start atom %pK of RP %d\n",
1430*4882a593Smuzhiyun (void *)start_katom, start_katom->renderpass_id);
1431*4882a593Smuzhiyun
1432*4882a593Smuzhiyun /* The following members are read when updating the job slot
1433*4882a593Smuzhiyun * ringbuffer/fifo, therefore they require additional locking.
1434*4882a593Smuzhiyun */
1435*4882a593Smuzhiyun spin_lock_irqsave(&kbdev->hwaccess_lock, flags);
1436*4882a593Smuzhiyun
1437*4882a593Smuzhiyun rp->state = KBASE_JD_RP_START;
1438*4882a593Smuzhiyun rp->start_katom = start_katom;
1439*4882a593Smuzhiyun rp->end_katom = NULL;
1440*4882a593Smuzhiyun INIT_LIST_HEAD(&rp->oom_reg_list);
1441*4882a593Smuzhiyun
1442*4882a593Smuzhiyun spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
1443*4882a593Smuzhiyun
1444*4882a593Smuzhiyun return 0;
1445*4882a593Smuzhiyun }
1446*4882a593Smuzhiyun
1447*4882a593Smuzhiyun /**
1448*4882a593Smuzhiyun * js_add_end_rp() - Add an atom that ends a renderpass to the job scheduler
1449*4882a593Smuzhiyun * @end_katom: Pointer to the atom to be added.
1450*4882a593Smuzhiyun * Return: 0 if successful or a negative value on failure.
1451*4882a593Smuzhiyun */
1452*4882a593Smuzhiyun static int js_add_end_rp(struct kbase_jd_atom *const end_katom)
1453*4882a593Smuzhiyun {
1454*4882a593Smuzhiyun struct kbase_context *const kctx = end_katom->kctx;
1455*4882a593Smuzhiyun struct kbase_jd_renderpass *rp;
1456*4882a593Smuzhiyun struct kbase_device *const kbdev = kctx->kbdev;
1457*4882a593Smuzhiyun
1458*4882a593Smuzhiyun lockdep_assert_held(&kctx->jctx.lock);
1459*4882a593Smuzhiyun
1460*4882a593Smuzhiyun if (WARN_ON(!(end_katom->core_req & BASE_JD_REQ_END_RENDERPASS)))
1461*4882a593Smuzhiyun return -EINVAL;
1462*4882a593Smuzhiyun
1463*4882a593Smuzhiyun if (end_katom->core_req & BASE_JD_REQ_START_RENDERPASS)
1464*4882a593Smuzhiyun return -EINVAL;
1465*4882a593Smuzhiyun
1466*4882a593Smuzhiyun compiletime_assert((1ull << (sizeof(end_katom->renderpass_id) * 8)) <=
1467*4882a593Smuzhiyun ARRAY_SIZE(kctx->jctx.renderpasses),
1468*4882a593Smuzhiyun "Should check invalid access to renderpasses");
1469*4882a593Smuzhiyun
1470*4882a593Smuzhiyun rp = &kctx->jctx.renderpasses[end_katom->renderpass_id];
1471*4882a593Smuzhiyun
1472*4882a593Smuzhiyun dev_dbg(kbdev->dev, "JS add end atom %pK in state %d of RP %d\n",
1473*4882a593Smuzhiyun (void *)end_katom, (int)rp->state, end_katom->renderpass_id);
1474*4882a593Smuzhiyun
1475*4882a593Smuzhiyun if (rp->state == KBASE_JD_RP_COMPLETE)
1476*4882a593Smuzhiyun return -EINVAL;
1477*4882a593Smuzhiyun
1478*4882a593Smuzhiyun if (rp->end_katom == NULL) {
1479*4882a593Smuzhiyun /* We can't be in a retry state until the fragment job chain
1480*4882a593Smuzhiyun * has completed.
1481*4882a593Smuzhiyun */
1482*4882a593Smuzhiyun unsigned long flags;
1483*4882a593Smuzhiyun
1484*4882a593Smuzhiyun WARN_ON(rp->state == KBASE_JD_RP_RETRY);
1485*4882a593Smuzhiyun WARN_ON(rp->state == KBASE_JD_RP_RETRY_PEND_OOM);
1486*4882a593Smuzhiyun WARN_ON(rp->state == KBASE_JD_RP_RETRY_OOM);
1487*4882a593Smuzhiyun
1488*4882a593Smuzhiyun spin_lock_irqsave(&kbdev->hwaccess_lock, flags);
1489*4882a593Smuzhiyun rp->end_katom = end_katom;
1490*4882a593Smuzhiyun spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
1491*4882a593Smuzhiyun } else
1492*4882a593Smuzhiyun WARN_ON(rp->end_katom != end_katom);
1493*4882a593Smuzhiyun
1494*4882a593Smuzhiyun return 0;
1495*4882a593Smuzhiyun }
1496*4882a593Smuzhiyun
1497*4882a593Smuzhiyun bool kbasep_js_add_job(struct kbase_context *kctx,
1498*4882a593Smuzhiyun struct kbase_jd_atom *atom)
1499*4882a593Smuzhiyun {
1500*4882a593Smuzhiyun unsigned long flags;
1501*4882a593Smuzhiyun struct kbasep_js_kctx_info *js_kctx_info;
1502*4882a593Smuzhiyun struct kbase_device *kbdev;
1503*4882a593Smuzhiyun struct kbasep_js_device_data *js_devdata;
1504*4882a593Smuzhiyun int err = 0;
1505*4882a593Smuzhiyun
1506*4882a593Smuzhiyun bool enqueue_required = false;
1507*4882a593Smuzhiyun bool timer_sync = false;
1508*4882a593Smuzhiyun
1509*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(kctx != NULL);
1510*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(atom != NULL);
1511*4882a593Smuzhiyun lockdep_assert_held(&kctx->jctx.lock);
1512*4882a593Smuzhiyun
1513*4882a593Smuzhiyun kbdev = kctx->kbdev;
1514*4882a593Smuzhiyun js_devdata = &kbdev->js_data;
1515*4882a593Smuzhiyun js_kctx_info = &kctx->jctx.sched_info;
1516*4882a593Smuzhiyun
1517*4882a593Smuzhiyun mutex_lock(&js_devdata->queue_mutex);
1518*4882a593Smuzhiyun mutex_lock(&js_kctx_info->ctx.jsctx_mutex);
1519*4882a593Smuzhiyun
1520*4882a593Smuzhiyun if (atom->core_req & BASE_JD_REQ_START_RENDERPASS)
1521*4882a593Smuzhiyun err = js_add_start_rp(atom);
1522*4882a593Smuzhiyun else if (atom->core_req & BASE_JD_REQ_END_RENDERPASS)
1523*4882a593Smuzhiyun err = js_add_end_rp(atom);
1524*4882a593Smuzhiyun
1525*4882a593Smuzhiyun if (err < 0) {
1526*4882a593Smuzhiyun atom->event_code = BASE_JD_EVENT_JOB_INVALID;
1527*4882a593Smuzhiyun atom->status = KBASE_JD_ATOM_STATE_COMPLETED;
1528*4882a593Smuzhiyun goto out_unlock;
1529*4882a593Smuzhiyun }
1530*4882a593Smuzhiyun
1531*4882a593Smuzhiyun /*
1532*4882a593Smuzhiyun * Begin Runpool transaction
1533*4882a593Smuzhiyun */
1534*4882a593Smuzhiyun mutex_lock(&js_devdata->runpool_mutex);
1535*4882a593Smuzhiyun
1536*4882a593Smuzhiyun /* Refcount ctx.nr_jobs */
1537*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(js_kctx_info->ctx.nr_jobs < U32_MAX);
1538*4882a593Smuzhiyun ++(js_kctx_info->ctx.nr_jobs);
1539*4882a593Smuzhiyun dev_dbg(kbdev->dev, "Add atom %pK to kctx %pK; now %d in ctx\n",
1540*4882a593Smuzhiyun (void *)atom, (void *)kctx, js_kctx_info->ctx.nr_jobs);
1541*4882a593Smuzhiyun
1542*4882a593Smuzhiyun /* Lock for state available during IRQ */
1543*4882a593Smuzhiyun spin_lock_irqsave(&kbdev->hwaccess_lock, flags);
1544*4882a593Smuzhiyun
1545*4882a593Smuzhiyun if (++kctx->atoms_count[atom->sched_priority] == 1)
1546*4882a593Smuzhiyun kbase_js_update_ctx_priority(kctx);
1547*4882a593Smuzhiyun
1548*4882a593Smuzhiyun if (!kbase_js_dep_validate(kctx, atom)) {
1549*4882a593Smuzhiyun /* Dependencies could not be represented */
1550*4882a593Smuzhiyun --(js_kctx_info->ctx.nr_jobs);
1551*4882a593Smuzhiyun dev_dbg(kbdev->dev,
1552*4882a593Smuzhiyun "Remove atom %pK from kctx %pK; now %d in ctx\n",
1553*4882a593Smuzhiyun (void *)atom, (void *)kctx, js_kctx_info->ctx.nr_jobs);
1554*4882a593Smuzhiyun
1555*4882a593Smuzhiyun /* Setting atom status back to queued as it still has unresolved
1556*4882a593Smuzhiyun * dependencies
1557*4882a593Smuzhiyun */
1558*4882a593Smuzhiyun atom->status = KBASE_JD_ATOM_STATE_QUEUED;
1559*4882a593Smuzhiyun dev_dbg(kbdev->dev, "Atom %pK status to queued\n", (void *)atom);
1560*4882a593Smuzhiyun
1561*4882a593Smuzhiyun /* Undo the count, as the atom will get added again later but
1562*4882a593Smuzhiyun * leave the context priority adjusted or boosted, in case
1563*4882a593Smuzhiyun * this was the first higher priority atom received for this
1564*4882a593Smuzhiyun * context.
1565*4882a593Smuzhiyun * This will prevent the scenario of priority inversion, where
1566*4882a593Smuzhiyun * another context having medium priority atoms keeps getting
1567*4882a593Smuzhiyun * scheduled over this context, which is having both lower and
1568*4882a593Smuzhiyun * higher priority atoms, but higher priority atoms are blocked
1569*4882a593Smuzhiyun * due to dependency on lower priority atoms. With priority
1570*4882a593Smuzhiyun * boost the high priority atom will get to run at earliest.
1571*4882a593Smuzhiyun */
1572*4882a593Smuzhiyun kctx->atoms_count[atom->sched_priority]--;
1573*4882a593Smuzhiyun
1574*4882a593Smuzhiyun spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
1575*4882a593Smuzhiyun mutex_unlock(&js_devdata->runpool_mutex);
1576*4882a593Smuzhiyun
1577*4882a593Smuzhiyun goto out_unlock;
1578*4882a593Smuzhiyun }
1579*4882a593Smuzhiyun
1580*4882a593Smuzhiyun enqueue_required = kbase_js_dep_resolved_submit(kctx, atom);
1581*4882a593Smuzhiyun
1582*4882a593Smuzhiyun KBASE_KTRACE_ADD_JM_REFCOUNT(kbdev, JS_ADD_JOB, kctx, atom, atom->jc,
1583*4882a593Smuzhiyun kbase_ktrace_get_ctx_refcnt(kctx));
1584*4882a593Smuzhiyun
1585*4882a593Smuzhiyun /* Context Attribute Refcounting */
1586*4882a593Smuzhiyun kbasep_js_ctx_attr_ctx_retain_atom(kbdev, kctx, atom);
1587*4882a593Smuzhiyun
1588*4882a593Smuzhiyun if (enqueue_required) {
1589*4882a593Smuzhiyun if (kbase_js_ctx_pullable(kctx, atom->slot_nr, false))
1590*4882a593Smuzhiyun timer_sync = kbase_js_ctx_list_add_pullable_nolock(
1591*4882a593Smuzhiyun kbdev, kctx, atom->slot_nr);
1592*4882a593Smuzhiyun else
1593*4882a593Smuzhiyun timer_sync = kbase_js_ctx_list_add_unpullable_nolock(
1594*4882a593Smuzhiyun kbdev, kctx, atom->slot_nr);
1595*4882a593Smuzhiyun }
1596*4882a593Smuzhiyun /* If this context is active and the atom is the first on its slot,
1597*4882a593Smuzhiyun * kick the job manager to attempt to fast-start the atom
1598*4882a593Smuzhiyun */
1599*4882a593Smuzhiyun if (enqueue_required && kctx ==
1600*4882a593Smuzhiyun kbdev->hwaccess.active_kctx[atom->slot_nr])
1601*4882a593Smuzhiyun kbase_jm_try_kick(kbdev, 1 << atom->slot_nr);
1602*4882a593Smuzhiyun
1603*4882a593Smuzhiyun spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
1604*4882a593Smuzhiyun if (timer_sync)
1605*4882a593Smuzhiyun kbase_backend_ctx_count_changed(kbdev);
1606*4882a593Smuzhiyun mutex_unlock(&js_devdata->runpool_mutex);
1607*4882a593Smuzhiyun /* End runpool transaction */
1608*4882a593Smuzhiyun
1609*4882a593Smuzhiyun if (!kbase_ctx_flag(kctx, KCTX_SCHEDULED)) {
1610*4882a593Smuzhiyun if (kbase_ctx_flag(kctx, KCTX_DYING)) {
1611*4882a593Smuzhiyun /* A job got added while/after kbase_job_zap_context()
1612*4882a593Smuzhiyun * was called on a non-scheduled context. Kill that job
1613*4882a593Smuzhiyun * by killing the context.
1614*4882a593Smuzhiyun */
1615*4882a593Smuzhiyun kbasep_js_runpool_requeue_or_kill_ctx(kbdev, kctx,
1616*4882a593Smuzhiyun false);
1617*4882a593Smuzhiyun } else if (js_kctx_info->ctx.nr_jobs == 1) {
1618*4882a593Smuzhiyun /* Handle Refcount going from 0 to 1: schedule the
1619*4882a593Smuzhiyun * context on the Queue
1620*4882a593Smuzhiyun */
1621*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(!kbase_ctx_flag(kctx, KCTX_SCHEDULED));
1622*4882a593Smuzhiyun dev_dbg(kbdev->dev, "JS: Enqueue Context %pK", kctx);
1623*4882a593Smuzhiyun
1624*4882a593Smuzhiyun /* Queue was updated - caller must try to schedule the
1625*4882a593Smuzhiyun * head context
1626*4882a593Smuzhiyun */
1627*4882a593Smuzhiyun WARN_ON(!enqueue_required);
1628*4882a593Smuzhiyun }
1629*4882a593Smuzhiyun }
1630*4882a593Smuzhiyun out_unlock:
1631*4882a593Smuzhiyun dev_dbg(kbdev->dev, "Enqueue of kctx %pK is %srequired\n",
1632*4882a593Smuzhiyun kctx, enqueue_required ? "" : "not ");
1633*4882a593Smuzhiyun
1634*4882a593Smuzhiyun mutex_unlock(&js_kctx_info->ctx.jsctx_mutex);
1635*4882a593Smuzhiyun
1636*4882a593Smuzhiyun mutex_unlock(&js_devdata->queue_mutex);
1637*4882a593Smuzhiyun
1638*4882a593Smuzhiyun return enqueue_required;
1639*4882a593Smuzhiyun }
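/* Illustrative caller pattern (a sketch, not part of this driver): the
 * return value reports whether the context queue changed, in which case a
 * scheduling pass is worthwhile. Assuming the caller already holds
 * kctx->jctx.lock, the usage would be along these lines:
 *
 *	if (kbasep_js_add_job(kctx, katom))
 *		kbase_js_sched_all(kbdev);
 */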
1640*4882a593Smuzhiyun
1641*4882a593Smuzhiyun void kbasep_js_remove_job(struct kbase_device *kbdev,
1642*4882a593Smuzhiyun struct kbase_context *kctx, struct kbase_jd_atom *atom)
1643*4882a593Smuzhiyun {
1644*4882a593Smuzhiyun struct kbasep_js_kctx_info *js_kctx_info;
1645*4882a593Smuzhiyun unsigned long flags;
1646*4882a593Smuzhiyun
1647*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(kbdev != NULL);
1648*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(kctx != NULL);
1649*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(atom != NULL);
1650*4882a593Smuzhiyun
1651*4882a593Smuzhiyun js_kctx_info = &kctx->jctx.sched_info;
1652*4882a593Smuzhiyun
1653*4882a593Smuzhiyun KBASE_KTRACE_ADD_JM_REFCOUNT(kbdev, JS_REMOVE_JOB, kctx, atom, atom->jc,
1654*4882a593Smuzhiyun kbase_ktrace_get_ctx_refcnt(kctx));
1655*4882a593Smuzhiyun
1656*4882a593Smuzhiyun /* De-refcount ctx.nr_jobs */
1657*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(js_kctx_info->ctx.nr_jobs > 0);
1658*4882a593Smuzhiyun --(js_kctx_info->ctx.nr_jobs);
1659*4882a593Smuzhiyun dev_dbg(kbdev->dev,
1660*4882a593Smuzhiyun "Remove atom %pK from kctx %pK; now %d in ctx\n",
1661*4882a593Smuzhiyun (void *)atom, (void *)kctx, js_kctx_info->ctx.nr_jobs);
1662*4882a593Smuzhiyun
1663*4882a593Smuzhiyun spin_lock_irqsave(&kbdev->hwaccess_lock, flags);
1664*4882a593Smuzhiyun if (--kctx->atoms_count[atom->sched_priority] == 0)
1665*4882a593Smuzhiyun kbase_js_update_ctx_priority(kctx);
1666*4882a593Smuzhiyun spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
1667*4882a593Smuzhiyun }
1668*4882a593Smuzhiyun
1669*4882a593Smuzhiyun bool kbasep_js_remove_cancelled_job(struct kbase_device *kbdev,
1670*4882a593Smuzhiyun struct kbase_context *kctx, struct kbase_jd_atom *katom)
1671*4882a593Smuzhiyun {
1672*4882a593Smuzhiyun unsigned long flags;
1673*4882a593Smuzhiyun struct kbasep_js_atom_retained_state katom_retained_state;
1674*4882a593Smuzhiyun bool attr_state_changed;
1675*4882a593Smuzhiyun
1676*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(kbdev != NULL);
1677*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(kctx != NULL);
1678*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(katom != NULL);
1679*4882a593Smuzhiyun
1680*4882a593Smuzhiyun kbasep_js_atom_retained_state_copy(&katom_retained_state, katom);
1681*4882a593Smuzhiyun kbasep_js_remove_job(kbdev, kctx, katom);
1682*4882a593Smuzhiyun
1683*4882a593Smuzhiyun spin_lock_irqsave(&kbdev->hwaccess_lock, flags);
1684*4882a593Smuzhiyun
1685*4882a593Smuzhiyun /* The atom has 'finished' (will not be re-run), so no need to call
1686*4882a593Smuzhiyun * kbasep_js_has_atom_finished().
1687*4882a593Smuzhiyun *
1688*4882a593Smuzhiyun * This is because it returns false for soft-stopped atoms, but we
1689*4882a593Smuzhiyun * want to override that, because we're cancelling an atom regardless of
1690*4882a593Smuzhiyun * whether it was soft-stopped or not
1691*4882a593Smuzhiyun */
1692*4882a593Smuzhiyun attr_state_changed = kbasep_js_ctx_attr_ctx_release_atom(kbdev, kctx,
1693*4882a593Smuzhiyun &katom_retained_state);
1694*4882a593Smuzhiyun spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
1695*4882a593Smuzhiyun
1696*4882a593Smuzhiyun return attr_state_changed;
1697*4882a593Smuzhiyun }
1698*4882a593Smuzhiyun
1699*4882a593Smuzhiyun /**
1700*4882a593Smuzhiyun * kbasep_js_run_jobs_after_ctx_and_atom_release - Try running more jobs after
1701*4882a593Smuzhiyun * releasing a context and/or atom
1702*4882a593Smuzhiyun * @kbdev: The kbase_device to operate on
1703*4882a593Smuzhiyun * @kctx: The kbase_context to operate on
1704*4882a593Smuzhiyun * @katom_retained_state: Retained state from the atom
1705*4882a593Smuzhiyun * @runpool_ctx_attr_change: True if the runpool context attributes have changed
1706*4882a593Smuzhiyun *
1707*4882a593Smuzhiyun * This collates a set of actions that must happen whilst hwaccess_lock is held.
1708*4882a593Smuzhiyun *
1709*4882a593Smuzhiyun * This includes running more jobs when:
1710*4882a593Smuzhiyun * - The previously released kctx caused a ctx attribute change,
1711*4882a593Smuzhiyun * - The released atom caused a ctx attribute change,
1712*4882a593Smuzhiyun * - Slots were previously blocked due to affinity restrictions,
1713*4882a593Smuzhiyun * - Submission during IRQ handling failed.
1714*4882a593Smuzhiyun *
1715*4882a593Smuzhiyun * Return: %KBASEP_JS_RELEASE_RESULT_SCHED_ALL if context attributes were
1716*4882a593Smuzhiyun * changed. The caller should try scheduling all contexts
1717*4882a593Smuzhiyun */
1718*4882a593Smuzhiyun static kbasep_js_release_result kbasep_js_run_jobs_after_ctx_and_atom_release(
1719*4882a593Smuzhiyun struct kbase_device *kbdev,
1720*4882a593Smuzhiyun struct kbase_context *kctx,
1721*4882a593Smuzhiyun struct kbasep_js_atom_retained_state *katom_retained_state,
1722*4882a593Smuzhiyun bool runpool_ctx_attr_change)
1723*4882a593Smuzhiyun {
1724*4882a593Smuzhiyun struct kbasep_js_device_data *js_devdata;
1725*4882a593Smuzhiyun kbasep_js_release_result result = 0;
1726*4882a593Smuzhiyun
1727*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(kbdev != NULL);
1728*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(kctx != NULL);
1729*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(katom_retained_state != NULL);
1730*4882a593Smuzhiyun js_devdata = &kbdev->js_data;
1731*4882a593Smuzhiyun
1732*4882a593Smuzhiyun lockdep_assert_held(&kctx->jctx.sched_info.ctx.jsctx_mutex);
1733*4882a593Smuzhiyun lockdep_assert_held(&js_devdata->runpool_mutex);
1734*4882a593Smuzhiyun lockdep_assert_held(&kbdev->hwaccess_lock);
1735*4882a593Smuzhiyun
1736*4882a593Smuzhiyun if (js_devdata->nr_user_contexts_running != 0 && runpool_ctx_attr_change) {
1737*4882a593Smuzhiyun /* A change in runpool ctx attributes might mean we can
1738*4882a593Smuzhiyun * run more jobs than before
1739*4882a593Smuzhiyun */
1740*4882a593Smuzhiyun result = KBASEP_JS_RELEASE_RESULT_SCHED_ALL;
1741*4882a593Smuzhiyun
1742*4882a593Smuzhiyun KBASE_KTRACE_ADD_JM_SLOT(kbdev, JD_DONE_TRY_RUN_NEXT_JOB,
1743*4882a593Smuzhiyun kctx, NULL, 0u, 0);
1744*4882a593Smuzhiyun }
1745*4882a593Smuzhiyun return result;
1746*4882a593Smuzhiyun }
1747*4882a593Smuzhiyun
1748*4882a593Smuzhiyun /**
1749*4882a593Smuzhiyun * kbasep_js_runpool_release_ctx_internal - Internal function to release the reference
1750*4882a593Smuzhiyun * on a ctx and an atom's "retained state", only
1751*4882a593Smuzhiyun * taking the runpool and AS transaction mutexes
1752*4882a593Smuzhiyun * @kbdev: The kbase_device to operate on
1753*4882a593Smuzhiyun * @kctx: The kbase_context to operate on
1754*4882a593Smuzhiyun * @katom_retained_state: Retained state from the atom
1755*4882a593Smuzhiyun *
1756*4882a593Smuzhiyun * This also starts more jobs running in the case of a ctx-attribute state change
1757*4882a593Smuzhiyun *
1758*4882a593Smuzhiyun * This does none of the followup actions for scheduling:
1759*4882a593Smuzhiyun * - It does not schedule in a new context
1760*4882a593Smuzhiyun * - It does not requeue or handle dying contexts
1761*4882a593Smuzhiyun *
1762*4882a593Smuzhiyun * For those tasks, just call kbasep_js_runpool_release_ctx() instead
1763*4882a593Smuzhiyun *
1764*4882a593Smuzhiyun * Has the following requirements:
1765*4882a593Smuzhiyun * - Context is scheduled in, and kctx->as_nr matches kctx_as_nr
1766*4882a593Smuzhiyun * - Context has a non-zero refcount
1767*4882a593Smuzhiyun * - Caller holds js_kctx_info->ctx.jsctx_mutex
1768*4882a593Smuzhiyun * - Caller holds js_devdata->runpool_mutex
1769*4882a593Smuzhiyun *
1770*4882a593Smuzhiyun * Return: A bitpattern, containing KBASEP_JS_RELEASE_RESULT_* flags, indicating
1771*4882a593Smuzhiyun * the result of releasing a context: whether the caller should try
1772*4882a593Smuzhiyun * scheduling a new context and/or try scheduling all contexts.
1773*4882a593Smuzhiyun */
1774*4882a593Smuzhiyun static kbasep_js_release_result kbasep_js_runpool_release_ctx_internal(
1775*4882a593Smuzhiyun struct kbase_device *kbdev,
1776*4882a593Smuzhiyun struct kbase_context *kctx,
1777*4882a593Smuzhiyun struct kbasep_js_atom_retained_state *katom_retained_state)
1778*4882a593Smuzhiyun {
1779*4882a593Smuzhiyun unsigned long flags;
1780*4882a593Smuzhiyun struct kbasep_js_device_data *js_devdata;
1781*4882a593Smuzhiyun struct kbasep_js_kctx_info *js_kctx_info;
1782*4882a593Smuzhiyun
1783*4882a593Smuzhiyun kbasep_js_release_result release_result = 0u;
1784*4882a593Smuzhiyun bool runpool_ctx_attr_change = false;
1785*4882a593Smuzhiyun int kctx_as_nr;
1786*4882a593Smuzhiyun int new_ref_count;
1787*4882a593Smuzhiyun CSTD_UNUSED(kctx_as_nr);
1788*4882a593Smuzhiyun
1789*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(kbdev != NULL);
1790*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(kctx != NULL);
1791*4882a593Smuzhiyun js_kctx_info = &kctx->jctx.sched_info;
1792*4882a593Smuzhiyun js_devdata = &kbdev->js_data;
1793*4882a593Smuzhiyun
1794*4882a593Smuzhiyun /* Ensure context really is scheduled in */
1795*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(kbase_ctx_flag(kctx, KCTX_SCHEDULED));
1796*4882a593Smuzhiyun
1797*4882a593Smuzhiyun kctx_as_nr = kctx->as_nr;
1798*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(kctx_as_nr != KBASEP_AS_NR_INVALID);
1799*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(atomic_read(&kctx->refcount) > 0);
1800*4882a593Smuzhiyun
1801*4882a593Smuzhiyun /*
1802*4882a593Smuzhiyun * Transaction begins on AS and runpool_irq
1803*4882a593Smuzhiyun *
1804*4882a593Smuzhiyun * Assert about our calling contract
1805*4882a593Smuzhiyun */
1806*4882a593Smuzhiyun mutex_lock(&kbdev->pm.lock);
1807*4882a593Smuzhiyun spin_lock_irqsave(&kbdev->hwaccess_lock, flags);
1808*4882a593Smuzhiyun
1809*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(kctx_as_nr == kctx->as_nr);
1810*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(atomic_read(&kctx->refcount) > 0);
1811*4882a593Smuzhiyun
1812*4882a593Smuzhiyun /* Update refcount */
1813*4882a593Smuzhiyun kbase_ctx_sched_release_ctx(kctx);
1814*4882a593Smuzhiyun new_ref_count = atomic_read(&kctx->refcount);
1815*4882a593Smuzhiyun
1816*4882a593Smuzhiyun /* Release the atom if it finished (i.e. wasn't soft-stopped) */
1817*4882a593Smuzhiyun if (kbasep_js_has_atom_finished(katom_retained_state))
1818*4882a593Smuzhiyun runpool_ctx_attr_change |= kbasep_js_ctx_attr_ctx_release_atom(
1819*4882a593Smuzhiyun kbdev, kctx, katom_retained_state);
1820*4882a593Smuzhiyun
1821*4882a593Smuzhiyun if (new_ref_count == 2 && kbase_ctx_flag(kctx, KCTX_PRIVILEGED) &&
1822*4882a593Smuzhiyun #ifdef CONFIG_MALI_ARBITER_SUPPORT
1823*4882a593Smuzhiyun !kbase_pm_is_gpu_lost(kbdev) &&
1824*4882a593Smuzhiyun #endif
1825*4882a593Smuzhiyun !kbase_pm_is_suspending(kbdev)) {
1826*4882a593Smuzhiyun /* Context is kept scheduled into an address space even when
1827*4882a593Smuzhiyun * there are no jobs; in this case we have to handle the
1828*4882a593Smuzhiyun * situation where all jobs have been evicted from the GPU and
1829*4882a593Smuzhiyun * submission is disabled.
1830*4882a593Smuzhiyun *
1831*4882a593Smuzhiyun * At this point we re-enable submission to allow further jobs
1832*4882a593Smuzhiyun * to be executed
1833*4882a593Smuzhiyun */
1834*4882a593Smuzhiyun kbasep_js_set_submit_allowed(js_devdata, kctx);
1835*4882a593Smuzhiyun }
1836*4882a593Smuzhiyun
1837*4882a593Smuzhiyun /* Make a set of checks to see if the context should be scheduled out.
1838*4882a593Smuzhiyun * Note that there'll always be at least 1 reference to the context
1839*4882a593Smuzhiyun * which was previously acquired by kbasep_js_schedule_ctx().
1840*4882a593Smuzhiyun */
1841*4882a593Smuzhiyun if (new_ref_count == 1 &&
1842*4882a593Smuzhiyun (!kbasep_js_is_submit_allowed(js_devdata, kctx) ||
1843*4882a593Smuzhiyun #ifdef CONFIG_MALI_ARBITER_SUPPORT
1844*4882a593Smuzhiyun kbase_pm_is_gpu_lost(kbdev) ||
1845*4882a593Smuzhiyun #endif
1846*4882a593Smuzhiyun kbase_pm_is_suspending(kbdev))) {
1847*4882a593Smuzhiyun int num_slots = kbdev->gpu_props.num_job_slots;
1848*4882a593Smuzhiyun int slot;
1849*4882a593Smuzhiyun
1850*4882a593Smuzhiyun /* Last reference, and we've been told to remove this context
1851*4882a593Smuzhiyun * from the Run Pool
1852*4882a593Smuzhiyun */
1853*4882a593Smuzhiyun dev_dbg(kbdev->dev, "JS: RunPool Remove Context %pK because refcount=%d, jobs=%d, allowed=%d",
1854*4882a593Smuzhiyun kctx, new_ref_count, js_kctx_info->ctx.nr_jobs,
1855*4882a593Smuzhiyun kbasep_js_is_submit_allowed(js_devdata, kctx));
1856*4882a593Smuzhiyun
1857*4882a593Smuzhiyun KBASE_TLSTREAM_TL_NRET_AS_CTX(kbdev, &kbdev->as[kctx->as_nr], kctx);
1858*4882a593Smuzhiyun
1859*4882a593Smuzhiyun kbase_backend_release_ctx_irq(kbdev, kctx);
1860*4882a593Smuzhiyun
1861*4882a593Smuzhiyun for (slot = 0; slot < num_slots; slot++) {
1862*4882a593Smuzhiyun if (kbdev->hwaccess.active_kctx[slot] == kctx) {
1863*4882a593Smuzhiyun dev_dbg(kbdev->dev, "Marking kctx %pK as inactive (s:%d)\n",
1864*4882a593Smuzhiyun (void *)kctx, slot);
1865*4882a593Smuzhiyun kbdev->hwaccess.active_kctx[slot] = NULL;
1866*4882a593Smuzhiyun }
1867*4882a593Smuzhiyun }
1868*4882a593Smuzhiyun
1869*4882a593Smuzhiyun /* Ctx Attribute handling
1870*4882a593Smuzhiyun *
1871*4882a593Smuzhiyun * Releasing atom attributes must either happen before this, or
1872*4882a593Smuzhiyun * after the KCTX_SCHEDULED flag is changed, otherwise we
1873*4882a593Smuzhiyun * double-decrement the attributes
1874*4882a593Smuzhiyun */
1875*4882a593Smuzhiyun runpool_ctx_attr_change |=
1876*4882a593Smuzhiyun kbasep_js_ctx_attr_runpool_release_ctx(kbdev, kctx);
1877*4882a593Smuzhiyun
1878*4882a593Smuzhiyun /* Releasing the context and katom retained state can allow
1879*4882a593Smuzhiyun * more jobs to run
1880*4882a593Smuzhiyun */
1881*4882a593Smuzhiyun release_result |=
1882*4882a593Smuzhiyun kbasep_js_run_jobs_after_ctx_and_atom_release(kbdev,
1883*4882a593Smuzhiyun kctx, katom_retained_state,
1884*4882a593Smuzhiyun runpool_ctx_attr_change);
1885*4882a593Smuzhiyun
1886*4882a593Smuzhiyun /*
1887*4882a593Smuzhiyun * Transaction ends on AS and runpool_irq:
1888*4882a593Smuzhiyun *
1889*4882a593Smuzhiyun * By this point, the AS-related data is now clear and ready
1890*4882a593Smuzhiyun * for re-use.
1891*4882a593Smuzhiyun *
1892*4882a593Smuzhiyun * Since releases only occur once for each previous successful
1893*4882a593Smuzhiyun * retain, and no more retains are allowed on this context, no
1894*4882a593Smuzhiyun * other thread will be operating in this code whilst we are
1896*4882a593Smuzhiyun */
1897*4882a593Smuzhiyun
1898*4882a593Smuzhiyun /* Recalculate pullable status for all slots */
1899*4882a593Smuzhiyun for (slot = 0; slot < num_slots; slot++) {
1900*4882a593Smuzhiyun if (kbase_js_ctx_pullable(kctx, slot, false))
1901*4882a593Smuzhiyun kbase_js_ctx_list_add_pullable_nolock(kbdev,
1902*4882a593Smuzhiyun kctx, slot);
1903*4882a593Smuzhiyun }
1904*4882a593Smuzhiyun
1905*4882a593Smuzhiyun spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
1906*4882a593Smuzhiyun
1907*4882a593Smuzhiyun kbase_backend_release_ctx_noirq(kbdev, kctx);
1908*4882a593Smuzhiyun
1909*4882a593Smuzhiyun mutex_unlock(&kbdev->pm.lock);
1910*4882a593Smuzhiyun
1911*4882a593Smuzhiyun /* Note: Don't reuse kctx_as_nr now */
1912*4882a593Smuzhiyun
1913*4882a593Smuzhiyun /* Synchronize with any timers */
1914*4882a593Smuzhiyun kbase_backend_ctx_count_changed(kbdev);
1915*4882a593Smuzhiyun
1916*4882a593Smuzhiyun /* update book-keeping info */
1917*4882a593Smuzhiyun kbase_ctx_flag_clear(kctx, KCTX_SCHEDULED);
1918*4882a593Smuzhiyun /* Signal any waiter that the context is not scheduled, and so is
1919*4882a593Smuzhiyun * safe for termination - once the jsctx_mutex is also dropped,
1920*4882a593Smuzhiyun * and jobs have finished.
1921*4882a593Smuzhiyun */
1922*4882a593Smuzhiyun wake_up(&js_kctx_info->ctx.is_scheduled_wait);
1923*4882a593Smuzhiyun
1924*4882a593Smuzhiyun /* Queue an action to occur after we've dropped the lock */
1925*4882a593Smuzhiyun release_result |= KBASEP_JS_RELEASE_RESULT_WAS_DESCHEDULED |
1926*4882a593Smuzhiyun KBASEP_JS_RELEASE_RESULT_SCHED_ALL;
1927*4882a593Smuzhiyun } else {
1928*4882a593Smuzhiyun kbasep_js_run_jobs_after_ctx_and_atom_release(kbdev, kctx,
1929*4882a593Smuzhiyun katom_retained_state, runpool_ctx_attr_change);
1930*4882a593Smuzhiyun
1931*4882a593Smuzhiyun spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
1932*4882a593Smuzhiyun mutex_unlock(&kbdev->pm.lock);
1933*4882a593Smuzhiyun }
1934*4882a593Smuzhiyun
1935*4882a593Smuzhiyun return release_result;
1936*4882a593Smuzhiyun }
1937*4882a593Smuzhiyun
1938*4882a593Smuzhiyun void kbasep_js_runpool_release_ctx_nolock(struct kbase_device *kbdev,
1939*4882a593Smuzhiyun struct kbase_context *kctx)
1940*4882a593Smuzhiyun {
1941*4882a593Smuzhiyun struct kbasep_js_atom_retained_state katom_retained_state;
1942*4882a593Smuzhiyun
1943*4882a593Smuzhiyun /* Setup a dummy katom_retained_state */
1944*4882a593Smuzhiyun kbasep_js_atom_retained_state_init_invalid(&katom_retained_state);
1945*4882a593Smuzhiyun
1946*4882a593Smuzhiyun kbasep_js_runpool_release_ctx_internal(kbdev, kctx,
1947*4882a593Smuzhiyun &katom_retained_state);
1948*4882a593Smuzhiyun }
1949*4882a593Smuzhiyun
1950*4882a593Smuzhiyun void kbasep_js_runpool_requeue_or_kill_ctx(struct kbase_device *kbdev,
1951*4882a593Smuzhiyun struct kbase_context *kctx, bool has_pm_ref)
1952*4882a593Smuzhiyun {
1953*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(kbdev != NULL);
1954*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(kctx != NULL);
1955*4882a593Smuzhiyun
1956*4882a593Smuzhiyun /* This is called if and only if you've detached the context from
1957*4882a593Smuzhiyun * the Runpool Queue, and not added it back to the Runpool
1958*4882a593Smuzhiyun */
1959*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(!kbase_ctx_flag(kctx, KCTX_SCHEDULED));
1960*4882a593Smuzhiyun
1961*4882a593Smuzhiyun if (kbase_ctx_flag(kctx, KCTX_DYING)) {
1962*4882a593Smuzhiyun /* Dying: don't requeue, but kill all jobs on the context. This
1963*4882a593Smuzhiyun * happens asynchronously
1964*4882a593Smuzhiyun */
1965*4882a593Smuzhiyun dev_dbg(kbdev->dev,
1966*4882a593Smuzhiyun "JS: ** Killing Context %pK on RunPool Remove **", kctx);
1967*4882a593Smuzhiyun kbase_js_foreach_ctx_job(kctx, &kbase_jd_cancel);
1968*4882a593Smuzhiyun }
1969*4882a593Smuzhiyun }
1970*4882a593Smuzhiyun
1971*4882a593Smuzhiyun void kbasep_js_runpool_release_ctx_and_katom_retained_state(
1972*4882a593Smuzhiyun struct kbase_device *kbdev, struct kbase_context *kctx,
1973*4882a593Smuzhiyun struct kbasep_js_atom_retained_state *katom_retained_state)
1974*4882a593Smuzhiyun {
1975*4882a593Smuzhiyun struct kbasep_js_device_data *js_devdata;
1976*4882a593Smuzhiyun struct kbasep_js_kctx_info *js_kctx_info;
1977*4882a593Smuzhiyun kbasep_js_release_result release_result;
1978*4882a593Smuzhiyun
1979*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(kbdev != NULL);
1980*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(kctx != NULL);
1981*4882a593Smuzhiyun js_kctx_info = &kctx->jctx.sched_info;
1982*4882a593Smuzhiyun js_devdata = &kbdev->js_data;
1983*4882a593Smuzhiyun
1984*4882a593Smuzhiyun mutex_lock(&js_devdata->queue_mutex);
1985*4882a593Smuzhiyun mutex_lock(&js_kctx_info->ctx.jsctx_mutex);
1986*4882a593Smuzhiyun mutex_lock(&js_devdata->runpool_mutex);
1987*4882a593Smuzhiyun
1988*4882a593Smuzhiyun release_result = kbasep_js_runpool_release_ctx_internal(kbdev, kctx,
1989*4882a593Smuzhiyun katom_retained_state);
1990*4882a593Smuzhiyun
1991*4882a593Smuzhiyun /* Drop the runpool mutex to allow requeuing kctx */
1992*4882a593Smuzhiyun mutex_unlock(&js_devdata->runpool_mutex);
1993*4882a593Smuzhiyun
1994*4882a593Smuzhiyun if ((release_result & KBASEP_JS_RELEASE_RESULT_WAS_DESCHEDULED) != 0u)
1995*4882a593Smuzhiyun kbasep_js_runpool_requeue_or_kill_ctx(kbdev, kctx, true);
1996*4882a593Smuzhiyun
1997*4882a593Smuzhiyun /* Drop the jsctx_mutex to allow scheduling in a new context */
1998*4882a593Smuzhiyun
1999*4882a593Smuzhiyun mutex_unlock(&js_kctx_info->ctx.jsctx_mutex);
2000*4882a593Smuzhiyun mutex_unlock(&js_devdata->queue_mutex);
2001*4882a593Smuzhiyun
2002*4882a593Smuzhiyun if (release_result & KBASEP_JS_RELEASE_RESULT_SCHED_ALL)
2003*4882a593Smuzhiyun kbase_js_sched_all(kbdev);
2004*4882a593Smuzhiyun }
2005*4882a593Smuzhiyun
2006*4882a593Smuzhiyun void kbasep_js_runpool_release_ctx(struct kbase_device *kbdev,
2007*4882a593Smuzhiyun struct kbase_context *kctx)
2008*4882a593Smuzhiyun {
2009*4882a593Smuzhiyun struct kbasep_js_atom_retained_state katom_retained_state;
2010*4882a593Smuzhiyun
2011*4882a593Smuzhiyun kbasep_js_atom_retained_state_init_invalid(&katom_retained_state);
2012*4882a593Smuzhiyun
2013*4882a593Smuzhiyun kbasep_js_runpool_release_ctx_and_katom_retained_state(kbdev, kctx,
2014*4882a593Smuzhiyun &katom_retained_state);
2015*4882a593Smuzhiyun }
2016*4882a593Smuzhiyun
2017*4882a593Smuzhiyun /* Variant of kbasep_js_runpool_release_ctx() that doesn't call into
2018*4882a593Smuzhiyun * kbase_js_sched_all()
2019*4882a593Smuzhiyun */
2020*4882a593Smuzhiyun static void kbasep_js_runpool_release_ctx_no_schedule(
2021*4882a593Smuzhiyun struct kbase_device *kbdev, struct kbase_context *kctx)
2022*4882a593Smuzhiyun {
2023*4882a593Smuzhiyun struct kbasep_js_device_data *js_devdata;
2024*4882a593Smuzhiyun struct kbasep_js_kctx_info *js_kctx_info;
2025*4882a593Smuzhiyun kbasep_js_release_result release_result;
2026*4882a593Smuzhiyun struct kbasep_js_atom_retained_state katom_retained_state_struct;
2027*4882a593Smuzhiyun struct kbasep_js_atom_retained_state *katom_retained_state =
2028*4882a593Smuzhiyun &katom_retained_state_struct;
2029*4882a593Smuzhiyun
2030*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(kbdev != NULL);
2031*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(kctx != NULL);
2032*4882a593Smuzhiyun js_kctx_info = &kctx->jctx.sched_info;
2033*4882a593Smuzhiyun js_devdata = &kbdev->js_data;
2034*4882a593Smuzhiyun kbasep_js_atom_retained_state_init_invalid(katom_retained_state);
2035*4882a593Smuzhiyun
2036*4882a593Smuzhiyun mutex_lock(&js_kctx_info->ctx.jsctx_mutex);
2037*4882a593Smuzhiyun mutex_lock(&js_devdata->runpool_mutex);
2038*4882a593Smuzhiyun
2039*4882a593Smuzhiyun release_result = kbasep_js_runpool_release_ctx_internal(kbdev, kctx,
2040*4882a593Smuzhiyun katom_retained_state);
2041*4882a593Smuzhiyun
2042*4882a593Smuzhiyun /* Drop the runpool mutex to allow requeuing kctx */
2043*4882a593Smuzhiyun mutex_unlock(&js_devdata->runpool_mutex);
2044*4882a593Smuzhiyun if ((release_result & KBASEP_JS_RELEASE_RESULT_WAS_DESCHEDULED) != 0u)
2045*4882a593Smuzhiyun kbasep_js_runpool_requeue_or_kill_ctx(kbdev, kctx, true);
2046*4882a593Smuzhiyun
2047*4882a593Smuzhiyun /* Drop the jsctx_mutex to allow scheduling in a new context */
2048*4882a593Smuzhiyun mutex_unlock(&js_kctx_info->ctx.jsctx_mutex);
2049*4882a593Smuzhiyun
2050*4882a593Smuzhiyun /* NOTE: could return release_result if the caller would like to know
2051*4882a593Smuzhiyun * whether it should schedule a new context, but currently no callers do
2052*4882a593Smuzhiyun */
2053*4882a593Smuzhiyun }
2054*4882a593Smuzhiyun
2055*4882a593Smuzhiyun void kbase_js_set_timeouts(struct kbase_device *kbdev)
2056*4882a593Smuzhiyun {
2057*4882a593Smuzhiyun lockdep_assert_held(&kbdev->hwaccess_lock);
2058*4882a593Smuzhiyun
2059*4882a593Smuzhiyun kbase_backend_timeouts_changed(kbdev);
2060*4882a593Smuzhiyun }
2061*4882a593Smuzhiyun
2062*4882a593Smuzhiyun static bool kbasep_js_schedule_ctx(struct kbase_device *kbdev, struct kbase_context *kctx,
2063*4882a593Smuzhiyun unsigned int js)
2064*4882a593Smuzhiyun {
2065*4882a593Smuzhiyun struct kbasep_js_device_data *js_devdata;
2066*4882a593Smuzhiyun struct kbasep_js_kctx_info *js_kctx_info;
2067*4882a593Smuzhiyun unsigned long flags;
2068*4882a593Smuzhiyun bool kctx_suspended = false;
2069*4882a593Smuzhiyun int as_nr;
2070*4882a593Smuzhiyun
2071*4882a593Smuzhiyun dev_dbg(kbdev->dev, "Scheduling kctx %pK (s:%u)\n", kctx, js);
2072*4882a593Smuzhiyun
2073*4882a593Smuzhiyun js_devdata = &kbdev->js_data;
2074*4882a593Smuzhiyun js_kctx_info = &kctx->jctx.sched_info;
2075*4882a593Smuzhiyun
2076*4882a593Smuzhiyun /* Pick available address space for this context */
2077*4882a593Smuzhiyun mutex_lock(&kbdev->mmu_hw_mutex);
2078*4882a593Smuzhiyun spin_lock_irqsave(&kbdev->hwaccess_lock, flags);
2079*4882a593Smuzhiyun as_nr = kbase_ctx_sched_retain_ctx(kctx);
2080*4882a593Smuzhiyun spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
2081*4882a593Smuzhiyun mutex_unlock(&kbdev->mmu_hw_mutex);
2082*4882a593Smuzhiyun if (as_nr == KBASEP_AS_NR_INVALID) {
2083*4882a593Smuzhiyun as_nr = kbase_backend_find_and_release_free_address_space(
2084*4882a593Smuzhiyun kbdev, kctx);
2085*4882a593Smuzhiyun if (as_nr != KBASEP_AS_NR_INVALID) {
2086*4882a593Smuzhiyun /* Attempt to retain the context again; this should
2087*4882a593Smuzhiyun * succeed
2088*4882a593Smuzhiyun */
2089*4882a593Smuzhiyun mutex_lock(&kbdev->mmu_hw_mutex);
2090*4882a593Smuzhiyun spin_lock_irqsave(&kbdev->hwaccess_lock, flags);
2091*4882a593Smuzhiyun as_nr = kbase_ctx_sched_retain_ctx(kctx);
2092*4882a593Smuzhiyun spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
2093*4882a593Smuzhiyun mutex_unlock(&kbdev->mmu_hw_mutex);
2094*4882a593Smuzhiyun
2095*4882a593Smuzhiyun WARN_ON(as_nr == KBASEP_AS_NR_INVALID);
2096*4882a593Smuzhiyun }
2097*4882a593Smuzhiyun }
2098*4882a593Smuzhiyun if ((as_nr < 0) || (as_nr >= BASE_MAX_NR_AS))
2099*4882a593Smuzhiyun return false; /* No address space currently available */
2100*4882a593Smuzhiyun
2101*4882a593Smuzhiyun /*
2102*4882a593Smuzhiyun * Atomic transaction on the Context and Run Pool begins
2103*4882a593Smuzhiyun */
2104*4882a593Smuzhiyun mutex_lock(&js_kctx_info->ctx.jsctx_mutex);
2105*4882a593Smuzhiyun mutex_lock(&js_devdata->runpool_mutex);
2106*4882a593Smuzhiyun mutex_lock(&kbdev->mmu_hw_mutex);
2107*4882a593Smuzhiyun spin_lock_irqsave(&kbdev->hwaccess_lock, flags);
2108*4882a593Smuzhiyun
2109*4882a593Smuzhiyun /* Check to see if context is dying due to kbase_job_zap_context() */
2110*4882a593Smuzhiyun if (kbase_ctx_flag(kctx, KCTX_DYING)) {
2111*4882a593Smuzhiyun /* Roll back the transaction so far and return */
2112*4882a593Smuzhiyun kbase_ctx_sched_release_ctx(kctx);
2113*4882a593Smuzhiyun
2114*4882a593Smuzhiyun spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
2115*4882a593Smuzhiyun mutex_unlock(&kbdev->mmu_hw_mutex);
2116*4882a593Smuzhiyun mutex_unlock(&js_devdata->runpool_mutex);
2117*4882a593Smuzhiyun mutex_unlock(&js_kctx_info->ctx.jsctx_mutex);
2118*4882a593Smuzhiyun
2119*4882a593Smuzhiyun return false;
2120*4882a593Smuzhiyun }
2121*4882a593Smuzhiyun
2122*4882a593Smuzhiyun KBASE_KTRACE_ADD_JM_REFCOUNT(kbdev, JS_TRY_SCHEDULE_HEAD_CTX, kctx, NULL,
2123*4882a593Smuzhiyun 0u,
2124*4882a593Smuzhiyun kbase_ktrace_get_ctx_refcnt(kctx));
2125*4882a593Smuzhiyun
2126*4882a593Smuzhiyun kbase_ctx_flag_set(kctx, KCTX_SCHEDULED);
2127*4882a593Smuzhiyun
2128*4882a593Smuzhiyun /* Assign context to previously chosen address space */
2129*4882a593Smuzhiyun if (!kbase_backend_use_ctx(kbdev, kctx, as_nr)) {
2130*4882a593Smuzhiyun /* Roll back the transaction so far and return */
2131*4882a593Smuzhiyun kbase_ctx_sched_release_ctx(kctx);
2132*4882a593Smuzhiyun kbase_ctx_flag_clear(kctx, KCTX_SCHEDULED);
2133*4882a593Smuzhiyun
2134*4882a593Smuzhiyun spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
2135*4882a593Smuzhiyun mutex_unlock(&kbdev->mmu_hw_mutex);
2136*4882a593Smuzhiyun mutex_unlock(&js_devdata->runpool_mutex);
2137*4882a593Smuzhiyun mutex_unlock(&js_kctx_info->ctx.jsctx_mutex);
2138*4882a593Smuzhiyun
2139*4882a593Smuzhiyun return false;
2140*4882a593Smuzhiyun }
2141*4882a593Smuzhiyun
2142*4882a593Smuzhiyun kbdev->hwaccess.active_kctx[js] = kctx;
2143*4882a593Smuzhiyun
2144*4882a593Smuzhiyun KBASE_TLSTREAM_TL_RET_AS_CTX(kbdev, &kbdev->as[kctx->as_nr], kctx);
2145*4882a593Smuzhiyun
2146*4882a593Smuzhiyun /* Cause any future waiter-on-termination to wait until the context is
2147*4882a593Smuzhiyun * descheduled
2148*4882a593Smuzhiyun */
2149*4882a593Smuzhiyun wake_up(&js_kctx_info->ctx.is_scheduled_wait);
2150*4882a593Smuzhiyun
2151*4882a593Smuzhiyun /* Re-check for suspending: a suspend could've occurred, and all the
2152*4882a593Smuzhiyun * contexts could've been removed from the runpool before we took this
2153*4882a593Smuzhiyun * lock. In this case, we don't want to allow this context to run jobs,
2154*4882a593Smuzhiyun * we just want it out immediately.
2155*4882a593Smuzhiyun *
2156*4882a593Smuzhiyun * The DMB required to read the suspend flag was issued recently as part
2157*4882a593Smuzhiyun * of the hwaccess_lock locking. If a suspend occurs *after* that lock
2158*4882a593Smuzhiyun * was taken (i.e. this condition doesn't execute), then the
2159*4882a593Smuzhiyun * kbasep_js_suspend() code will cleanup this context instead (by virtue
2160*4882a593Smuzhiyun * of it being called strictly after the suspend flag is set, and will
2161*4882a593Smuzhiyun * wait for this lock to drop)
2162*4882a593Smuzhiyun */
2163*4882a593Smuzhiyun #ifdef CONFIG_MALI_ARBITER_SUPPORT
2164*4882a593Smuzhiyun if (kbase_pm_is_suspending(kbdev) || kbase_pm_is_gpu_lost(kbdev)) {
2165*4882a593Smuzhiyun #else
2166*4882a593Smuzhiyun if (kbase_pm_is_suspending(kbdev)) {
2167*4882a593Smuzhiyun #endif
2168*4882a593Smuzhiyun /* Cause it to leave at some later point */
2169*4882a593Smuzhiyun bool retained;
2170*4882a593Smuzhiyun CSTD_UNUSED(retained);
2171*4882a593Smuzhiyun
2172*4882a593Smuzhiyun retained = kbase_ctx_sched_inc_refcount_nolock(kctx);
2173*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(retained);
2174*4882a593Smuzhiyun
2175*4882a593Smuzhiyun kbasep_js_clear_submit_allowed(js_devdata, kctx);
2176*4882a593Smuzhiyun kctx_suspended = true;
2177*4882a593Smuzhiyun }
2178*4882a593Smuzhiyun
2179*4882a593Smuzhiyun kbase_ctx_flag_clear(kctx, KCTX_PULLED_SINCE_ACTIVE_JS0 << js);
2180*4882a593Smuzhiyun
2181*4882a593Smuzhiyun /* Transaction complete */
2182*4882a593Smuzhiyun spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
2183*4882a593Smuzhiyun mutex_unlock(&kbdev->mmu_hw_mutex);
2184*4882a593Smuzhiyun
2185*4882a593Smuzhiyun /* Synchronize with any timers */
2186*4882a593Smuzhiyun kbase_backend_ctx_count_changed(kbdev);
2187*4882a593Smuzhiyun
2188*4882a593Smuzhiyun mutex_unlock(&js_devdata->runpool_mutex);
2189*4882a593Smuzhiyun mutex_unlock(&js_kctx_info->ctx.jsctx_mutex);
2190*4882a593Smuzhiyun /* Note: after this point, the context could potentially get scheduled
2191*4882a593Smuzhiyun * out immediately
2192*4882a593Smuzhiyun */
2193*4882a593Smuzhiyun
2194*4882a593Smuzhiyun if (kctx_suspended) {
2195*4882a593Smuzhiyun /* Finishing forcing out the context due to a suspend. Use a
2196*4882a593Smuzhiyun * variant of kbasep_js_runpool_release_ctx() that doesn't
2197*4882a593Smuzhiyun * schedule a new context, to prevent a risk of recursion back
2198*4882a593Smuzhiyun * into this function
2199*4882a593Smuzhiyun */
2200*4882a593Smuzhiyun kbasep_js_runpool_release_ctx_no_schedule(kbdev, kctx);
2201*4882a593Smuzhiyun return false;
2202*4882a593Smuzhiyun }
2203*4882a593Smuzhiyun return true;
2204*4882a593Smuzhiyun }
2205*4882a593Smuzhiyun
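/* Make @kctx the active context on slot @js. Fast path: if the context is
 * already scheduled and still holds an address space it is simply marked
 * active; otherwise fall back to the full kbasep_js_schedule_ctx() path.
 */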
static bool kbase_js_use_ctx(struct kbase_device *kbdev, struct kbase_context *kctx,
			     unsigned int js)
{
	unsigned long flags;

	spin_lock_irqsave(&kbdev->hwaccess_lock, flags);

	if (kbase_ctx_flag(kctx, KCTX_SCHEDULED) &&
	    kbase_backend_use_ctx_sched(kbdev, kctx, js)) {
		dev_dbg(kbdev->dev, "kctx %pK already has ASID - mark as active (s:%u)\n",
			(void *)kctx, js);

		if (kbdev->hwaccess.active_kctx[js] != kctx) {
			kbdev->hwaccess.active_kctx[js] = kctx;
			kbase_ctx_flag_clear(kctx,
					     KCTX_PULLED_SINCE_ACTIVE_JS0 << js);
		}
		spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
		return true; /* Context already scheduled */
	}

	spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
	return kbasep_js_schedule_ctx(kbdev, kctx, js);
}

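/* Schedule a context and guarantee it an address space: mark it privileged,
 * queue it at the head of the pullable list if necessary and block until
 * the scheduler has actually brought it in.
 */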
void kbasep_js_schedule_privileged_ctx(struct kbase_device *kbdev,
				       struct kbase_context *kctx)
{
	struct kbasep_js_kctx_info *js_kctx_info;
	struct kbasep_js_device_data *js_devdata;
	bool is_scheduled;

	KBASE_DEBUG_ASSERT(kbdev != NULL);
	KBASE_DEBUG_ASSERT(kctx != NULL);

	js_devdata = &kbdev->js_data;
	js_kctx_info = &kctx->jctx.sched_info;

#ifdef CONFIG_MALI_ARBITER_SUPPORT
	/* This should only happen in response to a system call
	 * from a user-space thread.
	 * In a non-arbitrated environment this can never happen
	 * whilst suspending.
	 *
	 * In an arbitrated environment, user-space threads can run
	 * while we are suspended (for example when the GPU is not
	 * available to this VM); however, in that case we will block
	 * on the wait event for KCTX_SCHEDULED, since no context
	 * can be scheduled until we have the GPU again.
	 */
	if (kbdev->arb.arb_if == NULL)
		if (WARN_ON(kbase_pm_is_suspending(kbdev)))
			return;
#else
	/* This should only happen in response to a system call
	 * from a user-space thread.
	 * In a non-arbitrated environment this can never happen
	 * whilst suspending.
	 */
	if (WARN_ON(kbase_pm_is_suspending(kbdev)))
		return;
#endif

	mutex_lock(&js_devdata->queue_mutex);
	mutex_lock(&js_kctx_info->ctx.jsctx_mutex);

	/* Mark the context as privileged */
	kbase_ctx_flag_set(kctx, KCTX_PRIVILEGED);

	is_scheduled = kbase_ctx_flag(kctx, KCTX_SCHEDULED);
	if (!is_scheduled) {
		/* Add the context to the pullable list */
		if (kbase_js_ctx_list_add_pullable_head(kbdev, kctx, 0))
			kbase_js_sync_timers(kbdev);

		/* Fast-starting requires the jsctx_mutex to be dropped,
		 * because it works on multiple ctxs
		 */
		mutex_unlock(&js_kctx_info->ctx.jsctx_mutex);
		mutex_unlock(&js_devdata->queue_mutex);

		/* Try to schedule the context in */
		kbase_js_sched_all(kbdev);

		/* Wait for the context to be scheduled in */
		wait_event(kctx->jctx.sched_info.ctx.is_scheduled_wait,
			   kbase_ctx_flag(kctx, KCTX_SCHEDULED));
	} else {
		/* Already scheduled in - we need to retain it to keep the
		 * corresponding address space
		 */
		WARN_ON(!kbase_ctx_sched_inc_refcount(kctx));
		mutex_unlock(&js_kctx_info->ctx.jsctx_mutex);
		mutex_unlock(&js_devdata->queue_mutex);
	}
}
KBASE_EXPORT_TEST_API(kbasep_js_schedule_privileged_ctx);

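/* Drop the privileged state set by kbasep_js_schedule_privileged_ctx() and
 * release the extra reference it took, allowing the context to be scheduled
 * out again.
 */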
void kbasep_js_release_privileged_ctx(struct kbase_device *kbdev,
				      struct kbase_context *kctx)
{
	struct kbasep_js_kctx_info *js_kctx_info;

	KBASE_DEBUG_ASSERT(kctx != NULL);
	js_kctx_info = &kctx->jctx.sched_info;

	/* We don't need to use the address space anymore */
	mutex_lock(&js_kctx_info->ctx.jsctx_mutex);
	kbase_ctx_flag_clear(kctx, KCTX_PRIVILEGED);
	mutex_unlock(&js_kctx_info->ctx.jsctx_mutex);

	/* Release the context - it will be scheduled out */
	kbasep_js_runpool_release_ctx(kbdev, kctx);

	kbase_js_sched_all(kbdev);
}
KBASE_EXPORT_TEST_API(kbasep_js_release_privileged_ctx);

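/* Prepare the job scheduler for a system suspend: block all submission,
 * then take and drop a reference on every context still holding an address
 * space so that each one is descheduled at some later point.
 */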
void kbasep_js_suspend(struct kbase_device *kbdev)
{
	unsigned long flags;
	struct kbasep_js_device_data *js_devdata;
	int i;
	u16 retained = 0u;

	KBASE_DEBUG_ASSERT(kbdev);
	KBASE_DEBUG_ASSERT(kbase_pm_is_suspending(kbdev));
	js_devdata = &kbdev->js_data;

	spin_lock_irqsave(&kbdev->hwaccess_lock, flags);

	/* Prevent all contexts from submitting */
	js_devdata->runpool_irq.submit_allowed = 0;

	/* Retain each of the contexts, so we can cause them to leave even if
	 * they had no refcount to begin with
	 */
	for (i = BASE_MAX_NR_AS - 1; i >= 0; --i) {
		struct kbase_context *kctx = kbdev->as_to_kctx[i];

		retained = retained << 1;

		if (kctx && !(kbdev->as_free & (1u << i))) {
			kbase_ctx_sched_retain_ctx_refcount(kctx);
			retained |= 1u;
			/* This loop will not have an effect on the privileged
			 * contexts as they would have an extra ref count
			 * compared to the normal contexts, so they will hold
			 * on to their address spaces. The MMU will be
			 * re-enabled for them on resume.
			 */
		}
	}

	spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);

	/* De-ref the previous retain to ensure each context gets pulled out
	 * sometime later.
	 */
	for (i = 0;
	     i < BASE_MAX_NR_AS;
	     ++i, retained = retained >> 1) {
		struct kbase_context *kctx = kbdev->as_to_kctx[i];

		if (retained & 1u)
			kbasep_js_runpool_release_ctx(kbdev, kctx);
	}

	/* Caller must wait for all Power Manager active references to be
	 * dropped
	 */
}

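/* Undo kbasep_js_suspend() after a system resume: re-add any context that
 * became pullable to the queues, then kick the scheduler to restart atom
 * processing.
 */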
void kbasep_js_resume(struct kbase_device *kbdev)
{
	struct kbasep_js_device_data *js_devdata;
	int js, prio;

	KBASE_DEBUG_ASSERT(kbdev);
	js_devdata = &kbdev->js_data;
	KBASE_DEBUG_ASSERT(!kbase_pm_is_suspending(kbdev));

	mutex_lock(&js_devdata->queue_mutex);
	for (js = 0; js < kbdev->gpu_props.num_job_slots; js++) {
		for (prio = KBASE_JS_ATOM_SCHED_PRIO_FIRST;
		     prio < KBASE_JS_ATOM_SCHED_PRIO_COUNT; prio++) {
			struct kbase_context *kctx, *n;
			unsigned long flags;

#ifndef CONFIG_MALI_ARBITER_SUPPORT
			spin_lock_irqsave(&kbdev->hwaccess_lock, flags);

			list_for_each_entry_safe(kctx, n,
				&kbdev->js_data.ctx_list_unpullable[js][prio],
				jctx.sched_info.ctx.ctx_list_entry[js]) {
				struct kbasep_js_kctx_info *js_kctx_info;
				bool timer_sync = false;

				/* Drop lock so we can take kctx mutexes */
				spin_unlock_irqrestore(&kbdev->hwaccess_lock,
						       flags);

				js_kctx_info = &kctx->jctx.sched_info;

				mutex_lock(&js_kctx_info->ctx.jsctx_mutex);
				mutex_lock(&js_devdata->runpool_mutex);
				spin_lock_irqsave(&kbdev->hwaccess_lock, flags);

				if (!kbase_ctx_flag(kctx, KCTX_SCHEDULED) &&
				    kbase_js_ctx_pullable(kctx, js, false))
					timer_sync =
						kbase_js_ctx_list_add_pullable_nolock(
							kbdev, kctx, js);

				spin_unlock_irqrestore(&kbdev->hwaccess_lock,
						       flags);

				if (timer_sync)
					kbase_backend_ctx_count_changed(kbdev);

				mutex_unlock(&js_devdata->runpool_mutex);
				mutex_unlock(&js_kctx_info->ctx.jsctx_mutex);

				/* Take lock before accessing list again */
				spin_lock_irqsave(&kbdev->hwaccess_lock, flags);
			}
			spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
#else
			bool timer_sync = false;

			spin_lock_irqsave(&kbdev->hwaccess_lock, flags);

			list_for_each_entry_safe(kctx, n,
				&kbdev->js_data.ctx_list_unpullable[js][prio],
				jctx.sched_info.ctx.ctx_list_entry[js]) {

				if (!kbase_ctx_flag(kctx, KCTX_SCHEDULED) &&
				    kbase_js_ctx_pullable(kctx, js, false))
					timer_sync |=
						kbase_js_ctx_list_add_pullable_nolock(
							kbdev, kctx, js);
			}

			spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);

			if (timer_sync) {
				mutex_lock(&js_devdata->runpool_mutex);
				kbase_backend_ctx_count_changed(kbdev);
				mutex_unlock(&js_devdata->runpool_mutex);
			}
#endif
		}
	}
	mutex_unlock(&js_devdata->queue_mutex);

	/* Restart atom processing */
	kbase_js_sched_all(kbdev);

	/* JS Resume complete */
}

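/* An atom's requirements are valid if fragment work is not mixed with
 * compute/tiler work and any explicitly requested job slot is in range.
 */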
bool kbase_js_is_atom_valid(struct kbase_device *kbdev,
			    struct kbase_jd_atom *katom)
{
	if ((katom->core_req & BASE_JD_REQ_FS) &&
	    (katom->core_req & (BASE_JD_REQ_CS | BASE_JD_REQ_ONLY_COMPUTE |
				BASE_JD_REQ_T)))
		return false;

	if ((katom->core_req & BASE_JD_REQ_JOB_SLOT) &&
	    (katom->jobslot >= BASE_JM_MAX_NR_SLOTS))
		return false;

	return true;
}

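/* Map an atom's core requirements to a job slot: an explicit slot request
 * wins, fragment jobs go to slot 0, compute-only jobs targeting the second
 * of two core groups go to slot 2, and everything else goes to slot 1.
 */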
static unsigned int kbase_js_get_slot(struct kbase_device *kbdev, struct kbase_jd_atom *katom)
{
	if (katom->core_req & BASE_JD_REQ_JOB_SLOT)
		return katom->jobslot;

	if (katom->core_req & BASE_JD_REQ_FS)
		return 0;

	if (katom->core_req & BASE_JD_REQ_ONLY_COMPUTE) {
		if (katom->device_nr == 1 &&
		    kbdev->gpu_props.num_core_groups == 2)
			return 2;
	}

	return 1;
}

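/* Called (with the hwaccess_lock and jctx.lock held) once an atom's job
 * dependencies are resolved: place the atom either on the cross-slot
 * dependency list or in the runnable tree, and report whether the context
 * needs to be enqueued because the slot just became pullable.
 */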
bool kbase_js_dep_resolved_submit(struct kbase_context *kctx,
				  struct kbase_jd_atom *katom)
{
	bool enqueue_required, add_required = true;

	katom->slot_nr = kbase_js_get_slot(kctx->kbdev, katom);

	lockdep_assert_held(&kctx->kbdev->hwaccess_lock);
	lockdep_assert_held(&kctx->jctx.lock);

	/* If the slot will transition from unpullable to pullable then add
	 * the context to the pullable list
	 */
	if (jsctx_rb_none_to_pull(kctx, katom->slot_nr))
		enqueue_required = true;
	else
		enqueue_required = false;

	if ((katom->atom_flags & KBASE_KATOM_FLAG_X_DEP_BLOCKED) ||
	    (katom->pre_dep && (katom->pre_dep->atom_flags &
				KBASE_KATOM_FLAG_JSCTX_IN_X_DEP_LIST))) {
		int prio = katom->sched_priority;
		unsigned int js = katom->slot_nr;
		struct jsctx_queue *queue = &kctx->jsctx_queue[prio][js];

		dev_dbg(kctx->kbdev->dev, "Add atom %pK to X_DEP list (s:%u)\n",
			(void *)katom, js);

		list_add_tail(&katom->queue, &queue->x_dep_head);
		katom->atom_flags |= KBASE_KATOM_FLAG_JSCTX_IN_X_DEP_LIST;
		if (kbase_js_atom_blocked_on_x_dep(katom)) {
			enqueue_required = false;
			add_required = false;
		}
	} else {
		dev_dbg(kctx->kbdev->dev, "Atom %pK not added to X_DEP list\n",
			(void *)katom);
	}

	if (add_required) {
		/* Check if there are lower priority jobs to soft stop */
		kbase_job_slot_ctx_priority_check_locked(kctx, katom);

		/* Add the atom to the ring buffer. */
		jsctx_tree_add(kctx, katom);
		katom->atom_flags |= KBASE_KATOM_FLAG_JSCTX_IN_TREE;
	}

	dev_dbg(kctx->kbdev->dev,
		"Enqueue of kctx %pK is %srequired to submit atom %pK\n",
		kctx, enqueue_required ? "" : "not ", katom);

	return enqueue_required;
}

/**
 * kbase_js_move_to_tree - Move atom (and any dependent atoms) to the
 *                         runnable_tree, ready for execution
 * @katom: Atom to submit
 *
 * It is assumed that @katom does not have KBASE_KATOM_FLAG_X_DEP_BLOCKED set,
 * but is still present in the x_dep list. If @katom has a same-slot dependent
 * atom then that atom (and any dependents) will also be moved.
 */
static void kbase_js_move_to_tree(struct kbase_jd_atom *katom)
{
	struct kbase_context *const kctx = katom->kctx;

	lockdep_assert_held(&kctx->kbdev->hwaccess_lock);

	while (katom) {
		WARN_ON(!(katom->atom_flags &
			  KBASE_KATOM_FLAG_JSCTX_IN_X_DEP_LIST));

		if (!kbase_js_atom_blocked_on_x_dep(katom)) {
			dev_dbg(kctx->kbdev->dev,
				"Del atom %pK from X_DEP list in js_move_to_tree\n",
				(void *)katom);

			list_del(&katom->queue);
			katom->atom_flags &=
				~KBASE_KATOM_FLAG_JSCTX_IN_X_DEP_LIST;
			/* For incremental rendering, an end-of-renderpass atom
			 * may have had its dependency on start-of-renderpass
			 * ignored and may therefore already be in the tree.
			 */
			if (!(katom->atom_flags &
			      KBASE_KATOM_FLAG_JSCTX_IN_TREE)) {
				jsctx_tree_add(kctx, katom);
				katom->atom_flags |=
					KBASE_KATOM_FLAG_JSCTX_IN_TREE;
			}
		} else {
			dev_dbg(kctx->kbdev->dev,
				"Atom %pK blocked on x-dep in js_move_to_tree\n",
				(void *)katom);
			break;
		}

		katom = katom->post_dep;
	}
}


/**
 * kbase_js_evict_deps - Evict dependencies of a failed atom.
 * @kctx: Context pointer
 * @katom: Pointer to the atom that has failed.
 * @js: The job slot the katom was run on.
 * @prio: Priority of the katom.
 *
 * Remove all post dependencies of an atom from the context ringbuffers.
 *
 * The original atom's event_code will be propagated to all dependent atoms.
 *
 * Context: Caller must hold the HW access lock
 */
static void kbase_js_evict_deps(struct kbase_context *kctx, struct kbase_jd_atom *katom,
				unsigned int js, int prio)
{
	struct kbase_jd_atom *x_dep = katom->x_post_dep;
	struct kbase_jd_atom *next_katom = katom->post_dep;

	lockdep_assert_held(&kctx->kbdev->hwaccess_lock);

	if (next_katom) {
		KBASE_DEBUG_ASSERT(next_katom->status !=
				   KBASE_JD_ATOM_STATE_HW_COMPLETED);
		next_katom->will_fail_event_code = katom->event_code;
	}

	/* Has a cross-slot dependency. */
	if (x_dep && (x_dep->atom_flags & (KBASE_KATOM_FLAG_JSCTX_IN_TREE |
					   KBASE_KATOM_FLAG_JSCTX_IN_X_DEP_LIST))) {
		/* Remove the dependency. */
		x_dep->atom_flags &= ~KBASE_KATOM_FLAG_X_DEP_BLOCKED;

		dev_dbg(kctx->kbdev->dev, "Cleared X_DEP flag on atom %pK\n",
			(void *)x_dep);

		/* Fail it if it had a data dependency. */
		if (x_dep->atom_flags & KBASE_KATOM_FLAG_FAIL_BLOCKER)
			x_dep->will_fail_event_code = katom->event_code;

		if (x_dep->atom_flags & KBASE_KATOM_FLAG_JSCTX_IN_X_DEP_LIST)
			kbase_js_move_to_tree(x_dep);
	}
}

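/* Pull the next runnable atom for job slot @js from @kctx's ringbuffer.
 * Returns NULL if submission is currently not possible: submit disallowed,
 * device suspending, atom or priority level blocked, or an unresolved
 * cross-slot dependency.
 */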
struct kbase_jd_atom *kbase_js_pull(struct kbase_context *kctx, unsigned int js)
{
	struct kbase_jd_atom *katom;
	struct kbasep_js_device_data *js_devdata;
	struct kbase_device *kbdev;
	int pulled;

	KBASE_DEBUG_ASSERT(kctx);

	kbdev = kctx->kbdev;
	dev_dbg(kbdev->dev, "JS: pulling an atom from kctx %pK (s:%u)\n", (void *)kctx, js);

	js_devdata = &kbdev->js_data;
	lockdep_assert_held(&kbdev->hwaccess_lock);

	if (!kbasep_js_is_submit_allowed(js_devdata, kctx)) {
		dev_dbg(kbdev->dev, "JS: No submit allowed for kctx %pK\n",
			(void *)kctx);
		return NULL;
	}
#ifdef CONFIG_MALI_ARBITER_SUPPORT
	if (kbase_pm_is_suspending(kbdev) || kbase_pm_is_gpu_lost(kbdev))
#else
	if (kbase_pm_is_suspending(kbdev))
#endif
		return NULL;

	katom = jsctx_rb_peek(kctx, js);
	if (!katom) {
		dev_dbg(kbdev->dev, "JS: No pullable atom in kctx %pK (s:%u)\n", (void *)kctx, js);
		return NULL;
	}
	if (kbase_jsctx_slot_prio_is_blocked(kctx, js, katom->sched_priority)) {
		dev_dbg(kbdev->dev,
			"JS: kctx %pK is blocked from submitting atoms at priority %d and lower (s:%u)\n",
			(void *)kctx, katom->sched_priority, js);
		return NULL;
	}
	if (atomic_read(&katom->blocked)) {
		dev_dbg(kbdev->dev, "JS: Atom %pK is blocked in js_pull\n",
			(void *)katom);
		return NULL;
	}

	/* Due to ordering restrictions when unpulling atoms on failure, we do
	 * not allow multiple runs of fail-dep atoms from the same context to be
	 * present on the same slot
	 */
	if (katom->pre_dep && kbase_jsctx_slot_atoms_pulled(kctx, js)) {
		struct kbase_jd_atom *prev_atom =
			kbase_backend_inspect_tail(kbdev, js);

		if (prev_atom && prev_atom->kctx != kctx)
			return NULL;
	}

	if (kbase_js_atom_blocked_on_x_dep(katom)) {
		if (katom->x_pre_dep->gpu_rb_state ==
		    KBASE_ATOM_GPU_RB_NOT_IN_SLOT_RB ||
		    katom->x_pre_dep->will_fail_event_code) {
			dev_dbg(kbdev->dev,
				"JS: X pre-dep %pK is not present in slot FIFO or will fail\n",
				(void *)katom->x_pre_dep);
			return NULL;
		}
		if ((katom->atom_flags & KBASE_KATOM_FLAG_FAIL_BLOCKER) &&
		    kbase_backend_nr_atoms_on_slot(kbdev, js)) {
			dev_dbg(kbdev->dev,
				"JS: Atom %pK has cross-slot fail dependency and atoms on slot (s:%u)\n",
				(void *)katom, js);
			return NULL;
		}
	}

	KBASE_KTRACE_ADD_JM_SLOT_INFO(kbdev, JS_PULL_JOB, kctx, katom,
				      katom->jc, js, katom->sched_priority);
	kbase_ctx_flag_set(kctx, KCTX_PULLED);
	kbase_ctx_flag_set(kctx, (KCTX_PULLED_SINCE_ACTIVE_JS0 << js));

	pulled = kbase_jsctx_slot_atom_pulled_inc(kctx, katom);
	if (pulled == 1 && !kctx->slots_pullable) {
		WARN_ON(kbase_ctx_flag(kctx, KCTX_RUNNABLE_REF));
		kbase_ctx_flag_set(kctx, KCTX_RUNNABLE_REF);
		atomic_inc(&kbdev->js_data.nr_contexts_runnable);
	}
	jsctx_rb_pull(kctx, katom);

	kbase_ctx_sched_retain_ctx_refcount(kctx);

	katom->ticks = 0;

	dev_dbg(kbdev->dev, "JS: successfully pulled atom %pK from kctx %pK (s:%u)\n",
		(void *)katom, (void *)kctx, js);

	return katom;
}

/**
 * js_return_of_start_rp() - Handle soft-stop of an atom that starts a
 *                           renderpass
 * @start_katom: Pointer to the start-of-renderpass atom that was soft-stopped
 *
 * This function is called to switch to incremental rendering if the tiler job
 * chain at the start of a renderpass has used too much memory. It prevents the
 * tiler job being pulled for execution in the job scheduler again until the
 * next phase of incremental rendering is complete.
 *
 * If the end-of-renderpass atom is already in the job scheduler (because a
 * previous attempt at tiling used too much memory during the same renderpass)
 * then it is unblocked; otherwise, it is run by handing it to the scheduler.
 */
static void js_return_of_start_rp(struct kbase_jd_atom *const start_katom)
{
	struct kbase_context *const kctx = start_katom->kctx;
	struct kbase_device *const kbdev = kctx->kbdev;
	struct kbase_jd_renderpass *rp;
	struct kbase_jd_atom *end_katom;
	unsigned long flags;

	lockdep_assert_held(&kctx->jctx.lock);

	if (WARN_ON(!(start_katom->core_req & BASE_JD_REQ_START_RENDERPASS)))
		return;

	compiletime_assert((1ull << (sizeof(start_katom->renderpass_id) * 8)) <=
			   ARRAY_SIZE(kctx->jctx.renderpasses),
			   "Should check invalid access to renderpasses");

	rp = &kctx->jctx.renderpasses[start_katom->renderpass_id];

	if (WARN_ON(rp->start_katom != start_katom))
		return;

	dev_dbg(kctx->kbdev->dev,
		"JS return start atom %pK in state %d of RP %d\n",
		(void *)start_katom, (int)rp->state,
		start_katom->renderpass_id);

	if (WARN_ON(rp->state == KBASE_JD_RP_COMPLETE))
		return;

	/* The tiler job might have been soft-stopped for some reason other
	 * than running out of memory.
	 */
	if (rp->state == KBASE_JD_RP_START || rp->state == KBASE_JD_RP_RETRY) {
		dev_dbg(kctx->kbdev->dev,
			"JS return isn't OOM in state %d of RP %d\n",
			(int)rp->state, start_katom->renderpass_id);
		return;
	}

	dev_dbg(kctx->kbdev->dev,
		"JS return confirm OOM in state %d of RP %d\n",
		(int)rp->state, start_katom->renderpass_id);

	if (WARN_ON(rp->state != KBASE_JD_RP_PEND_OOM &&
		    rp->state != KBASE_JD_RP_RETRY_PEND_OOM))
		return;

	/* Prevent the tiler job being pulled for execution in the
	 * job scheduler again.
	 */
	dev_dbg(kbdev->dev, "Blocking start atom %pK\n",
		(void *)start_katom);
	atomic_inc(&start_katom->blocked);

	spin_lock_irqsave(&kbdev->hwaccess_lock, flags);

	rp->state = (rp->state == KBASE_JD_RP_PEND_OOM) ?
		KBASE_JD_RP_OOM : KBASE_JD_RP_RETRY_OOM;

	/* Was the fragment job chain submitted to kbase yet? */
	end_katom = rp->end_katom;
	if (end_katom) {
		dev_dbg(kctx->kbdev->dev, "JS return add end atom %pK\n",
			(void *)end_katom);

		if (rp->state == KBASE_JD_RP_RETRY_OOM) {
			/* Allow the end of the renderpass to be pulled for
			 * execution again to continue incremental rendering.
			 */
			dev_dbg(kbdev->dev, "Unblocking end atom %pK\n",
				(void *)end_katom);
			atomic_dec(&end_katom->blocked);
			WARN_ON(!(end_katom->atom_flags &
				  KBASE_KATOM_FLAG_JSCTX_IN_TREE));
			WARN_ON(end_katom->status != KBASE_JD_ATOM_STATE_IN_JS);

			kbase_js_ctx_list_add_pullable_nolock(kbdev, kctx,
							      end_katom->slot_nr);

			/* Expect the fragment job chain to be scheduled without
			 * further action because this function is called when
			 * returning an atom to the job scheduler ringbuffer.
			 */
			end_katom = NULL;
		} else {
			WARN_ON(end_katom->status !=
				KBASE_JD_ATOM_STATE_QUEUED &&
				end_katom->status != KBASE_JD_ATOM_STATE_IN_JS);
		}
	}

	spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);

	if (end_katom)
		kbase_jd_dep_clear_locked(end_katom);
}

/**
 * js_return_of_end_rp() - Handle completion of an atom that ends a renderpass
 * @end_katom: Pointer to the end-of-renderpass atom that was completed
 *
 * This function is called to continue incremental rendering if the tiler job
 * chain at the start of a renderpass used too much memory. It resets the
 * mechanism for detecting excessive memory usage then allows the soft-stopped
 * tiler job chain to be pulled for execution again.
 *
 * The start-of-renderpass atom must already have been submitted to kbase.
 */
static void js_return_of_end_rp(struct kbase_jd_atom *const end_katom)
{
	struct kbase_context *const kctx = end_katom->kctx;
	struct kbase_device *const kbdev = kctx->kbdev;
	struct kbase_jd_renderpass *rp;
	struct kbase_jd_atom *start_katom;
	unsigned long flags;

	lockdep_assert_held(&kctx->jctx.lock);

	if (WARN_ON(!(end_katom->core_req & BASE_JD_REQ_END_RENDERPASS)))
		return;

	compiletime_assert((1ull << (sizeof(end_katom->renderpass_id) * 8)) <=
			   ARRAY_SIZE(kctx->jctx.renderpasses),
			   "Should check invalid access to renderpasses");

	rp = &kctx->jctx.renderpasses[end_katom->renderpass_id];

	if (WARN_ON(rp->end_katom != end_katom))
		return;

	dev_dbg(kctx->kbdev->dev,
		"JS return end atom %pK in state %d of RP %d\n",
		(void *)end_katom, (int)rp->state, end_katom->renderpass_id);

	if (WARN_ON(rp->state != KBASE_JD_RP_OOM &&
		    rp->state != KBASE_JD_RP_RETRY_OOM))
		return;

	/* Reduce the number of mapped pages in the memory regions that
	 * triggered out-of-memory last time so that we can detect excessive
	 * memory usage again.
	 */
	kbase_gpu_vm_lock(kctx);
	spin_lock_irqsave(&kbdev->hwaccess_lock, flags);

	while (!list_empty(&rp->oom_reg_list)) {
		struct kbase_va_region *reg =
			list_first_entry(&rp->oom_reg_list,
					 struct kbase_va_region, link);

		spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);

		dev_dbg(kbdev->dev,
			"Reset backing to %zu pages for region %pK\n",
			reg->threshold_pages, (void *)reg);

		if (!WARN_ON(reg->flags & KBASE_REG_VA_FREED))
			kbase_mem_shrink(kctx, reg, reg->threshold_pages);

		spin_lock_irqsave(&kbdev->hwaccess_lock, flags);
		dev_dbg(kbdev->dev, "Deleting region %pK from list\n",
			(void *)reg);
		list_del_init(&reg->link);
		kbase_va_region_alloc_put(kctx, reg);
	}

	spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
	kbase_gpu_vm_unlock(kctx);

	spin_lock_irqsave(&kbdev->hwaccess_lock, flags);
	rp->state = KBASE_JD_RP_RETRY;
	dev_dbg(kbdev->dev, "Changed state to %d for retry\n", rp->state);

	/* Allow the start of the renderpass to be pulled for execution again
	 * to begin/continue incremental rendering.
	 */
	start_katom = rp->start_katom;
	if (!WARN_ON(!start_katom)) {
		dev_dbg(kbdev->dev, "Unblocking start atom %pK\n",
			(void *)start_katom);
		atomic_dec(&start_katom->blocked);
		(void)kbase_js_ctx_list_add_pullable_head_nolock(kbdev, kctx,
								 start_katom->slot_nr);
	}

	spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
}

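/* Worker run when a soft-stopped atom is returned to the job scheduler:
 * undo the accounting done at pull time, re-add the context to the pullable
 * queues where appropriate, handle renderpass state transitions and release
 * the context's runpool reference.
 */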
static void js_return_worker(struct work_struct *data)
{
	struct kbase_jd_atom *katom = container_of(data, struct kbase_jd_atom,
						   work);
	struct kbase_context *kctx = katom->kctx;
	struct kbase_device *kbdev = kctx->kbdev;
	struct kbasep_js_device_data *js_devdata = &kbdev->js_data;
	struct kbasep_js_kctx_info *js_kctx_info = &kctx->jctx.sched_info;
	struct kbasep_js_atom_retained_state retained_state;
	int js = katom->slot_nr;
	bool slot_became_unblocked;
	bool timer_sync = false;
	bool context_idle = false;
	unsigned long flags;
	base_jd_core_req core_req = katom->core_req;
	u64 cache_jc = katom->jc;

	dev_dbg(kbdev->dev, "%s for atom %pK with event code 0x%x\n",
		__func__, (void *)katom, katom->event_code);

	KBASE_KTRACE_ADD_JM(kbdev, JS_RETURN_WORKER, kctx, katom, katom->jc, 0);

	if (katom->event_code != BASE_JD_EVENT_END_RP_DONE)
		KBASE_TLSTREAM_TL_EVENT_ATOM_SOFTSTOP_EX(kbdev, katom);

	kbase_backend_complete_wq(kbdev, katom);

	kbasep_js_atom_retained_state_copy(&retained_state, katom);

	mutex_lock(&js_devdata->queue_mutex);
	mutex_lock(&js_kctx_info->ctx.jsctx_mutex);

	if (katom->event_code != BASE_JD_EVENT_END_RP_DONE)
		atomic_dec(&katom->blocked);

	spin_lock_irqsave(&kbdev->hwaccess_lock, flags);

	slot_became_unblocked = kbase_jsctx_slot_atom_pulled_dec(kctx, katom);

	if (!kbase_jsctx_slot_atoms_pulled(kctx, js) &&
	    jsctx_rb_none_to_pull(kctx, js))
		timer_sync |= kbase_js_ctx_list_remove_nolock(kbdev, kctx, js);

	/* If the context is now unblocked on this slot after soft-stopped
	 * atoms, then only mark it as pullable on this slot if it is not
	 * idle
	 */
	if (slot_became_unblocked && kbase_jsctx_atoms_pulled(kctx) &&
	    kbase_js_ctx_pullable(kctx, js, true))
		timer_sync |=
			kbase_js_ctx_list_add_pullable_nolock(kbdev, kctx, js);

	if (!kbase_jsctx_atoms_pulled(kctx)) {
		dev_dbg(kbdev->dev,
			"No atoms currently pulled from context %pK\n",
			(void *)kctx);

		if (!kctx->slots_pullable) {
			dev_dbg(kbdev->dev,
				"Context %pK %s counted as runnable\n",
				(void *)kctx,
				kbase_ctx_flag(kctx, KCTX_RUNNABLE_REF) ?
				"is" : "isn't");

			WARN_ON(!kbase_ctx_flag(kctx, KCTX_RUNNABLE_REF));
			kbase_ctx_flag_clear(kctx, KCTX_RUNNABLE_REF);
			atomic_dec(&kbdev->js_data.nr_contexts_runnable);
			timer_sync = true;
		}

		if (kctx->as_nr != KBASEP_AS_NR_INVALID &&
		    !kbase_ctx_flag(kctx, KCTX_DYING)) {
			int num_slots = kbdev->gpu_props.num_job_slots;
			int slot;

			if (!kbasep_js_is_submit_allowed(js_devdata, kctx))
				kbasep_js_set_submit_allowed(js_devdata, kctx);

			for (slot = 0; slot < num_slots; slot++) {
				if (kbase_js_ctx_pullable(kctx, slot, true))
					timer_sync |=
						kbase_js_ctx_list_add_pullable_nolock(
							kbdev, kctx, slot);
			}
		}

		kbase_jm_idle_ctx(kbdev, kctx);

		context_idle = true;
	}

	spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);

	if (context_idle) {
		dev_dbg(kbdev->dev,
			"Context %pK %s counted as active\n",
			(void *)kctx,
			kbase_ctx_flag(kctx, KCTX_ACTIVE) ?
			"is" : "isn't");
		WARN_ON(!kbase_ctx_flag(kctx, KCTX_ACTIVE));
		kbase_ctx_flag_clear(kctx, KCTX_ACTIVE);
		kbase_pm_context_idle(kbdev);
	}

	if (timer_sync)
		kbase_js_sync_timers(kbdev);

	mutex_unlock(&js_kctx_info->ctx.jsctx_mutex);
	mutex_unlock(&js_devdata->queue_mutex);

	if (katom->core_req & BASE_JD_REQ_START_RENDERPASS) {
		mutex_lock(&kctx->jctx.lock);
		js_return_of_start_rp(katom);
		mutex_unlock(&kctx->jctx.lock);
	} else if (katom->event_code == BASE_JD_EVENT_END_RP_DONE) {
		mutex_lock(&kctx->jctx.lock);
		js_return_of_end_rp(katom);
		mutex_unlock(&kctx->jctx.lock);
	}

	dev_dbg(kbdev->dev, "JS: retained state %s finished",
		kbasep_js_has_atom_finished(&retained_state) ?
		"has" : "hasn't");

	WARN_ON(kbasep_js_has_atom_finished(&retained_state));

	kbasep_js_runpool_release_ctx_and_katom_retained_state(kbdev, kctx,
							       &retained_state);

	kbase_js_sched_all(kbdev);

	kbase_backend_complete_wq_post_sched(kbdev, core_req);

	KBASE_KTRACE_ADD_JM(kbdev, JS_RETURN_WORKER_END, kctx, NULL, cache_jc,
			    0);

	dev_dbg(kbdev->dev, "Leaving %s for atom %pK\n",
		__func__, (void *)katom);
}

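/* Return an atom that could not be started back to the ringbuffer; the
 * remaining clean-up is deferred to js_return_worker() on the context's
 * job_done_wq workqueue.
 */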
void kbase_js_unpull(struct kbase_context *kctx, struct kbase_jd_atom *katom)
{
	dev_dbg(kctx->kbdev->dev, "Unpulling atom %pK in kctx %pK\n",
		(void *)katom, (void *)kctx);

	lockdep_assert_held(&kctx->kbdev->hwaccess_lock);

	jsctx_rb_unpull(kctx, katom);

	WARN_ON(work_pending(&katom->work));

	/* Block re-submission until the workqueue has run */
	atomic_inc(&katom->blocked);

	kbase_job_check_leave_disjoint(kctx->kbdev, katom);

	INIT_WORK(&katom->work, js_return_worker);
	queue_work(kctx->jctx.job_done_wq, &katom->work);
}

3108*4882a593Smuzhiyun /**
3109*4882a593Smuzhiyun * js_complete_start_rp() - Handle completion of atom that starts a renderpass
3110*4882a593Smuzhiyun * @kctx: Context pointer
3111*4882a593Smuzhiyun * @start_katom: Pointer to the atom that completed
3112*4882a593Smuzhiyun *
3113*4882a593Smuzhiyun * Put any references to virtual memory regions that might have been added by
3114*4882a593Smuzhiyun * kbase_job_slot_softstop_start_rp() because the tiler job chain completed
3115*4882a593Smuzhiyun * despite any pending soft-stop request.
3116*4882a593Smuzhiyun *
3117*4882a593Smuzhiyun * If the atom that just completed was soft-stopped during a previous attempt to
3118*4882a593Smuzhiyun * run it then there should be a blocked end-of-renderpass atom waiting for it,
3119*4882a593Smuzhiyun * which we must unblock to process the output of the tiler job chain.
3120*4882a593Smuzhiyun *
3121*4882a593Smuzhiyun * Return: true if caller should call kbase_backend_ctx_count_changed()
3122*4882a593Smuzhiyun */
3123*4882a593Smuzhiyun static bool js_complete_start_rp(struct kbase_context *kctx,
3124*4882a593Smuzhiyun struct kbase_jd_atom *const start_katom)
3125*4882a593Smuzhiyun {
3126*4882a593Smuzhiyun struct kbase_device *const kbdev = kctx->kbdev;
3127*4882a593Smuzhiyun struct kbase_jd_renderpass *rp;
3128*4882a593Smuzhiyun bool timer_sync = false;
3129*4882a593Smuzhiyun
3130*4882a593Smuzhiyun lockdep_assert_held(&kctx->jctx.lock);
3131*4882a593Smuzhiyun
3132*4882a593Smuzhiyun if (WARN_ON(!(start_katom->core_req & BASE_JD_REQ_START_RENDERPASS)))
3133*4882a593Smuzhiyun return false;
3134*4882a593Smuzhiyun
3135*4882a593Smuzhiyun compiletime_assert((1ull << (sizeof(start_katom->renderpass_id) * 8)) <=
3136*4882a593Smuzhiyun ARRAY_SIZE(kctx->jctx.renderpasses),
3137*4882a593Smuzhiyun "Should check invalid access to renderpasses");
3138*4882a593Smuzhiyun
3139*4882a593Smuzhiyun rp = &kctx->jctx.renderpasses[start_katom->renderpass_id];
3140*4882a593Smuzhiyun
3141*4882a593Smuzhiyun if (WARN_ON(rp->start_katom != start_katom))
3142*4882a593Smuzhiyun return false;
3143*4882a593Smuzhiyun
3144*4882a593Smuzhiyun dev_dbg(kctx->kbdev->dev,
3145*4882a593Smuzhiyun "Start atom %pK is done in state %d of RP %d\n",
3146*4882a593Smuzhiyun (void *)start_katom, (int)rp->state,
3147*4882a593Smuzhiyun start_katom->renderpass_id);
3148*4882a593Smuzhiyun
3149*4882a593Smuzhiyun if (WARN_ON(rp->state == KBASE_JD_RP_COMPLETE))
3150*4882a593Smuzhiyun return false;
3151*4882a593Smuzhiyun
3152*4882a593Smuzhiyun if (rp->state == KBASE_JD_RP_PEND_OOM ||
3153*4882a593Smuzhiyun rp->state == KBASE_JD_RP_RETRY_PEND_OOM) {
3154*4882a593Smuzhiyun unsigned long flags;
3155*4882a593Smuzhiyun
3156*4882a593Smuzhiyun dev_dbg(kctx->kbdev->dev,
3157*4882a593Smuzhiyun "Start atom %pK completed before soft-stop\n",
3158*4882a593Smuzhiyun (void *)start_katom);
3159*4882a593Smuzhiyun
3160*4882a593Smuzhiyun kbase_gpu_vm_lock(kctx);
3161*4882a593Smuzhiyun spin_lock_irqsave(&kbdev->hwaccess_lock, flags);
3162*4882a593Smuzhiyun
3163*4882a593Smuzhiyun while (!list_empty(&rp->oom_reg_list)) {
3164*4882a593Smuzhiyun struct kbase_va_region *reg =
3165*4882a593Smuzhiyun list_first_entry(&rp->oom_reg_list,
3166*4882a593Smuzhiyun struct kbase_va_region, link);
3167*4882a593Smuzhiyun
3168*4882a593Smuzhiyun WARN_ON(reg->flags & KBASE_REG_VA_FREED);
3169*4882a593Smuzhiyun dev_dbg(kctx->kbdev->dev, "Deleting region %pK from list\n",
3170*4882a593Smuzhiyun (void *)reg);
3171*4882a593Smuzhiyun list_del_init(®->link);
3172*4882a593Smuzhiyun kbase_va_region_alloc_put(kctx, reg);
3173*4882a593Smuzhiyun }
3174*4882a593Smuzhiyun
3175*4882a593Smuzhiyun spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
3176*4882a593Smuzhiyun kbase_gpu_vm_unlock(kctx);
	} else {
		dev_dbg(kctx->kbdev->dev,
			"Start atom %pK did not exceed memory threshold\n",
			(void *)start_katom);

		WARN_ON(rp->state != KBASE_JD_RP_START &&
			rp->state != KBASE_JD_RP_RETRY);
	}

	if (rp->state == KBASE_JD_RP_RETRY ||
	    rp->state == KBASE_JD_RP_RETRY_PEND_OOM) {
		struct kbase_jd_atom *const end_katom = rp->end_katom;

		if (!WARN_ON(!end_katom)) {
			unsigned long flags;

			/* Allow the end of the renderpass to be pulled for
			 * execution again to continue incremental rendering.
			 */
			dev_dbg(kbdev->dev, "Unblocking end atom %pK!\n",
				(void *)end_katom);
			atomic_dec(&end_katom->blocked);

			spin_lock_irqsave(&kbdev->hwaccess_lock, flags);
			timer_sync = kbase_js_ctx_list_add_pullable_nolock(
				kbdev, kctx, end_katom->slot_nr);
			spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
		}
	}

	return timer_sync;
}

/**
 * js_complete_end_rp() - Handle final completion of atom that ends a renderpass
 * @kctx: Context pointer
 * @end_katom: Pointer to the atom that completed for the last time
 *
 * This function must only be called if the renderpass actually completed
 * without the tiler job chain at the start using too much memory; otherwise
 * completion of the end-of-renderpass atom is handled similarly to a soft-stop.
 */
static void js_complete_end_rp(struct kbase_context *kctx,
			       struct kbase_jd_atom *const end_katom)
{
	struct kbase_device *const kbdev = kctx->kbdev;
	unsigned long flags;
	struct kbase_jd_renderpass *rp;

	lockdep_assert_held(&kctx->jctx.lock);

	if (WARN_ON(!(end_katom->core_req & BASE_JD_REQ_END_RENDERPASS)))
		return;

	compiletime_assert((1ull << (sizeof(end_katom->renderpass_id) * 8)) <=
			ARRAY_SIZE(kctx->jctx.renderpasses),
			"Should check invalid access to renderpasses");

	rp = &kctx->jctx.renderpasses[end_katom->renderpass_id];

	if (WARN_ON(rp->end_katom != end_katom))
		return;

	dev_dbg(kbdev->dev, "End atom %pK is done in state %d of RP %d\n",
		(void *)end_katom, (int)rp->state, end_katom->renderpass_id);

	if (WARN_ON(rp->state == KBASE_JD_RP_COMPLETE) ||
	    WARN_ON(rp->state == KBASE_JD_RP_OOM) ||
	    WARN_ON(rp->state == KBASE_JD_RP_RETRY_OOM))
		return;

	/* Rendering completed without running out of memory. */
	spin_lock_irqsave(&kbdev->hwaccess_lock, flags);
	WARN_ON(!list_empty(&rp->oom_reg_list));
	rp->state = KBASE_JD_RP_COMPLETE;
	spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);

	dev_dbg(kbdev->dev, "Renderpass %d is complete\n",
		end_katom->renderpass_id);
}

bool kbase_js_complete_atom_wq(struct kbase_context *kctx,
			       struct kbase_jd_atom *katom)
{
	struct kbasep_js_kctx_info *js_kctx_info;
	struct kbasep_js_device_data *js_devdata;
	struct kbase_device *kbdev;
	unsigned long flags;
	bool timer_sync = false;
	int atom_slot;
	bool context_idle = false;
	int prio = katom->sched_priority;

	kbdev = kctx->kbdev;
	atom_slot = katom->slot_nr;

	dev_dbg(kbdev->dev, "%s for atom %pK (s:%d)\n",
		__func__, (void *)katom, atom_slot);

	/* Update the incremental rendering state machine. */
	if (katom->core_req & BASE_JD_REQ_START_RENDERPASS)
		timer_sync |= js_complete_start_rp(kctx, katom);
	else if (katom->core_req & BASE_JD_REQ_END_RENDERPASS)
		js_complete_end_rp(kctx, katom);

	js_kctx_info = &kctx->jctx.sched_info;
	js_devdata = &kbdev->js_data;

	lockdep_assert_held(&js_kctx_info->ctx.jsctx_mutex);

	mutex_lock(&js_devdata->runpool_mutex);
	spin_lock_irqsave(&kbdev->hwaccess_lock, flags);
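	/* If the atom was pulled into this context's runnable tree, update
	 * the pulled-atom accounting and possibly unblock the slot for this
	 * priority level.
	 */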
	if (katom->atom_flags & KBASE_KATOM_FLAG_JSCTX_IN_TREE) {
		bool slot_became_unblocked;

		dev_dbg(kbdev->dev, "Atom %pK is in runnable_tree\n",
			(void *)katom);

		slot_became_unblocked =
			kbase_jsctx_slot_atom_pulled_dec(kctx, katom);
		context_idle = !kbase_jsctx_atoms_pulled(kctx);

		if (!kbase_jsctx_atoms_pulled(kctx) && !kctx->slots_pullable) {
			WARN_ON(!kbase_ctx_flag(kctx, KCTX_RUNNABLE_REF));
			kbase_ctx_flag_clear(kctx, KCTX_RUNNABLE_REF);
			atomic_dec(&kbdev->js_data.nr_contexts_runnable);
			timer_sync = true;
		}

		/* If this slot has been blocked due to soft-stopped atoms, and
		 * all atoms have now been processed at this priority level and
		 * higher, then unblock the slot.
		 */
		if (slot_became_unblocked) {
			dev_dbg(kbdev->dev,
				"kctx %pK is no longer blocked from submitting on slot %d at priority %d or higher\n",
				(void *)kctx, atom_slot, prio);

			if (kbase_js_ctx_pullable(kctx, atom_slot, true))
				timer_sync |=
					kbase_js_ctx_list_add_pullable_nolock(
						kbdev, kctx, atom_slot);
		}
	}
	WARN_ON(!(katom->atom_flags & KBASE_KATOM_FLAG_JSCTX_IN_TREE));

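	/* If nothing is left to pull from this context on this slot, take the
	 * context off the per-slot list of contexts with work.
	 */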
	if (!kbase_jsctx_slot_atoms_pulled(kctx, atom_slot) &&
	    jsctx_rb_none_to_pull(kctx, atom_slot)) {
		if (!list_empty(
			&kctx->jctx.sched_info.ctx.ctx_list_entry[atom_slot]))
			timer_sync |= kbase_js_ctx_list_remove_nolock(
				kctx->kbdev, kctx, atom_slot);
	}

	/*
	 * If submission is disabled on this context (most likely due to an
	 * atom failure) and there are now no atoms left in the system then
	 * re-enable submission so that the context can be scheduled again.
	 */
	if (!kbasep_js_is_submit_allowed(js_devdata, kctx) &&
	    !kbase_jsctx_atoms_pulled(kctx) &&
	    !kbase_ctx_flag(kctx, KCTX_DYING)) {
		unsigned int js;

		kbasep_js_set_submit_allowed(js_devdata, kctx);

		for (js = 0; js < kbdev->gpu_props.num_job_slots; js++) {
			if (kbase_js_ctx_pullable(kctx, js, true))
				timer_sync |=
					kbase_js_ctx_list_add_pullable_nolock(
						kbdev, kctx, js);
		}
	} else if (katom->x_post_dep &&
		   kbasep_js_is_submit_allowed(js_devdata, kctx)) {
		unsigned int js;

		for (js = 0; js < kbdev->gpu_props.num_job_slots; js++) {
			if (kbase_js_ctx_pullable(kctx, js, true))
				timer_sync |=
					kbase_js_ctx_list_add_pullable_nolock(
						kbdev, kctx, js);
		}
	}

	/* Mark context as inactive. The pm reference will be dropped later in
	 * jd_done_worker().
	 */
	if (context_idle) {
		dev_dbg(kbdev->dev, "kctx %pK is no longer active\n",
			(void *)kctx);
		kbase_ctx_flag_clear(kctx, KCTX_ACTIVE);
	}

	spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
	if (timer_sync)
		kbase_backend_ctx_count_changed(kbdev);
	mutex_unlock(&js_devdata->runpool_mutex);

	dev_dbg(kbdev->dev, "Leaving %s\n", __func__);
	return context_idle;
}

/**
 * js_end_rp_is_complete() - Check whether an atom that ends a renderpass has
 *                           completed for the last time.
 *
 * @end_katom: Pointer to the atom that completed on the hardware.
 *
 * An atom that ends a renderpass may be run on the hardware several times
 * before notifying userspace or allowing dependent atoms to be executed.
 *
 * This function is used to decide whether or not to allow end-of-renderpass
 * atom completion. It only returns false if the atom at the start of the
 * renderpass was soft-stopped because it used too much memory during the most
 * recent attempt at tiling.
 *
 * Return: True if the atom completed for the last time.
 */
static bool js_end_rp_is_complete(struct kbase_jd_atom *const end_katom)
{
	struct kbase_context *const kctx = end_katom->kctx;
	struct kbase_device *const kbdev = kctx->kbdev;
	struct kbase_jd_renderpass *rp;

	lockdep_assert_held(&kctx->kbdev->hwaccess_lock);

	if (WARN_ON(!(end_katom->core_req & BASE_JD_REQ_END_RENDERPASS)))
		return true;

	compiletime_assert((1ull << (sizeof(end_katom->renderpass_id) * 8)) <=
			ARRAY_SIZE(kctx->jctx.renderpasses),
			"Should check invalid access to renderpasses");

	rp = &kctx->jctx.renderpasses[end_katom->renderpass_id];

	if (WARN_ON(rp->end_katom != end_katom))
		return true;

	dev_dbg(kbdev->dev,
		"JS complete end atom %pK in state %d of RP %d\n",
		(void *)end_katom, (int)rp->state,
		end_katom->renderpass_id);

	if (WARN_ON(rp->state == KBASE_JD_RP_COMPLETE))
		return true;

	/* Failure of end-of-renderpass atoms must not return to the
	 * start of the renderpass.
	 */
	if (end_katom->event_code != BASE_JD_EVENT_DONE)
		return true;

	if (rp->state != KBASE_JD_RP_OOM &&
	    rp->state != KBASE_JD_RP_RETRY_OOM)
		return true;

	dev_dbg(kbdev->dev, "Suppressing end atom completion\n");
	return false;
}

struct kbase_jd_atom *kbase_js_complete_atom(struct kbase_jd_atom *katom,
					     ktime_t *end_timestamp)
{
	struct kbase_device *kbdev;
	struct kbase_context *kctx = katom->kctx;
	struct kbase_jd_atom *x_dep = katom->x_post_dep;

	kbdev = kctx->kbdev;
	dev_dbg(kbdev->dev, "Atom %pK complete in kctx %pK (post-dep %pK)\n",
		(void *)katom, (void *)kctx, (void *)x_dep);

	lockdep_assert_held(&kctx->kbdev->hwaccess_lock);

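	/* If the start-of-renderpass atom was soft-stopped for using too much
	 * memory, this end atom has not really finished: flag it with
	 * BASE_JD_EVENT_END_RP_DONE and requeue it so it can be pulled again
	 * for another rendering pass.
	 */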
	if ((katom->core_req & BASE_JD_REQ_END_RENDERPASS) &&
	    !js_end_rp_is_complete(katom)) {
		katom->event_code = BASE_JD_EVENT_END_RP_DONE;
		kbase_js_unpull(kctx, katom);
		return NULL;
	}

	if (katom->will_fail_event_code)
		katom->event_code = katom->will_fail_event_code;

	katom->status = KBASE_JD_ATOM_STATE_HW_COMPLETED;
	dev_dbg(kbdev->dev, "Atom %pK status to HW completed\n", (void *)katom);
	if (kbase_is_quick_reset_enabled(kbdev)) {
		kbdev->num_of_atoms_hw_completed++;
		if (kbdev->num_of_atoms_hw_completed >= 20)
			kbase_disable_quick_reset(kbdev);
	}
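	/* Note: the threshold of 20 HW-completed atoms above, after which
	 * quick reset is disabled, appears to be an empirical cut-off; the
	 * rationale is not documented here.
	 */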

	if (katom->event_code != BASE_JD_EVENT_DONE) {
		kbase_js_evict_deps(kctx, katom, katom->slot_nr,
				katom->sched_priority);
	}

	KBASE_TLSTREAM_AUX_EVENT_JOB_SLOT(kbdev, NULL,
		katom->slot_nr, 0, TL_JS_EVENT_STOP);

	trace_sysgraph_gpu(SGR_COMPLETE, kctx->id,
		kbase_jd_atom_id(katom->kctx, katom), katom->slot_nr);

	KBASE_TLSTREAM_TL_JD_DONE_START(kbdev, katom);
	kbase_jd_done(katom, katom->slot_nr, end_timestamp, 0);
	KBASE_TLSTREAM_TL_JD_DONE_END(kbdev, katom);

	/* Unblock cross dependency if present */
	if (x_dep && (katom->event_code == BASE_JD_EVENT_DONE ||
		      !(x_dep->atom_flags & KBASE_KATOM_FLAG_FAIL_BLOCKER)) &&
	    (x_dep->atom_flags & KBASE_KATOM_FLAG_JSCTX_IN_X_DEP_LIST)) {
		bool was_pullable = kbase_js_ctx_pullable(kctx, x_dep->slot_nr,
							  false);
		x_dep->atom_flags &= ~KBASE_KATOM_FLAG_X_DEP_BLOCKED;
		dev_dbg(kbdev->dev, "Cleared X_DEP flag on atom %pK\n",
			(void *)x_dep);

		kbase_js_move_to_tree(x_dep);

		if (!was_pullable && kbase_js_ctx_pullable(kctx, x_dep->slot_nr,
							   false))
			kbase_js_ctx_list_add_pullable_nolock(kbdev, kctx,
							      x_dep->slot_nr);

		if (x_dep->atom_flags & KBASE_KATOM_FLAG_JSCTX_IN_TREE) {
			dev_dbg(kbdev->dev, "Atom %pK is in runnable tree\n",
				(void *)x_dep);
			return x_dep;
		}
	} else {
		dev_dbg(kbdev->dev,
			"No cross-slot dep to unblock for atom %pK\n",
			(void *)katom);
	}

	return NULL;
}

/**
 * kbase_js_atom_blocked_on_x_dep - Decide whether to ignore a cross-slot
 *                                  dependency
 * @katom: Pointer to an atom in the slot ringbuffer
 *
 * A cross-slot dependency is ignored if necessary to unblock incremental
 * rendering. If the atom at the start of a renderpass used too much memory
 * and was soft-stopped then the atom at the end of a renderpass is submitted
 * to hardware regardless of its dependency on the start-of-renderpass atom.
 * This can happen multiple times for the same pair of atoms.
 *
 * Return: true to block the atom or false to allow it to be submitted to
 * hardware
 */
bool kbase_js_atom_blocked_on_x_dep(struct kbase_jd_atom *const katom)
{
	struct kbase_context *const kctx = katom->kctx;
	struct kbase_device *kbdev = kctx->kbdev;
	struct kbase_jd_renderpass *rp;

	lockdep_assert_held(&kbdev->hwaccess_lock);

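	/* Decision summary: the atom stays blocked unless it ends a
	 * renderpass whose tiler job chain ran out of memory (state OOM or
	 * RETRY_OOM) and its only cross-slot dependency is on that
	 * renderpass's start atom.
	 */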
	if (!(katom->atom_flags & KBASE_KATOM_FLAG_X_DEP_BLOCKED)) {
		dev_dbg(kbdev->dev, "Atom %pK is not blocked on a cross-slot dependency",
			(void *)katom);
		return false;
	}

	if (!(katom->core_req & BASE_JD_REQ_END_RENDERPASS)) {
		dev_dbg(kbdev->dev, "Atom %pK is blocked on a cross-slot dependency",
			(void *)katom);
		return true;
	}

	compiletime_assert((1ull << (sizeof(katom->renderpass_id) * 8)) <=
			ARRAY_SIZE(kctx->jctx.renderpasses),
			"Should check invalid access to renderpasses");

	rp = &kctx->jctx.renderpasses[katom->renderpass_id];
	/* We can read a subset of renderpass state without holding
	 * higher-level locks (but not end_katom, for example).
	 */

	WARN_ON(rp->state == KBASE_JD_RP_COMPLETE);

	dev_dbg(kbdev->dev, "End atom has cross-slot dep in state %d\n",
		(int)rp->state);

	if (rp->state != KBASE_JD_RP_OOM && rp->state != KBASE_JD_RP_RETRY_OOM)
		return true;

	/* Tiler ran out of memory so allow the fragment job chain to run
	 * if it only depends on the tiler job chain.
	 */
	if (katom->x_pre_dep != rp->start_katom) {
		dev_dbg(kbdev->dev, "Dependency is on %pK not start atom %pK\n",
			(void *)katom->x_pre_dep, (void *)rp->start_katom);
		return true;
	}

	dev_dbg(kbdev->dev, "Ignoring cross-slot dep on atom %pK\n",
		(void *)katom->x_pre_dep);

	return false;
}

void kbase_js_sched(struct kbase_device *kbdev, unsigned int js_mask)
{
	struct kbasep_js_device_data *js_devdata;
	struct kbase_context *last_active[BASE_JM_MAX_NR_SLOTS];
	bool timer_sync = false;
	bool ctx_waiting[BASE_JM_MAX_NR_SLOTS];
	unsigned int js;

	KBASE_TLSTREAM_TL_JS_SCHED_START(kbdev, 0);

	dev_dbg(kbdev->dev, "%s kbdev %pK mask 0x%x\n",
		__func__, (void *)kbdev, (unsigned int)js_mask);

	js_devdata = &kbdev->js_data;

	down(&js_devdata->schedule_sem);
	mutex_lock(&js_devdata->queue_mutex);
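	/* schedule_sem serializes scheduling passes across the whole device,
	 * so only one thread walks the pullable context lists at a time.
	 */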

	for (js = 0; js < BASE_JM_MAX_NR_SLOTS; js++) {
		last_active[js] = kbdev->hwaccess.active_kctx[js];
		ctx_waiting[js] = false;
	}

	while (js_mask) {
		js = ffs(js_mask) - 1;
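		/* Service the lowest-numbered slot with pending work; a slot
		 * is cleared from js_mask below once no more atoms can be
		 * submitted on it.
		 */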

		while (1) {
			struct kbase_context *kctx;
			unsigned long flags;
			bool context_idle = false;

			kctx = kbase_js_ctx_list_pop_head(kbdev, js);

			if (!kctx) {
				js_mask &= ~(1 << js);
				dev_dbg(kbdev->dev, "No kctx on pullable list (s:%u)\n", js);
				break;
			}

			if (!kbase_ctx_flag(kctx, KCTX_ACTIVE)) {
				context_idle = true;

				dev_dbg(kbdev->dev, "kctx %pK is not active (s:%u)\n",
					(void *)kctx, js);

				if (kbase_pm_context_active_handle_suspend(
						kbdev,
						KBASE_PM_SUSPEND_HANDLER_DONT_INCREASE)) {
					dev_dbg(kbdev->dev, "Suspend pending (s:%u)\n", js);
					/* Suspend pending - return context to
					 * queue and stop scheduling
					 */
					mutex_lock(&kctx->jctx.sched_info.ctx.jsctx_mutex);
					if (kbase_js_ctx_list_add_pullable_head(
							kctx->kbdev, kctx, js))
						kbase_js_sync_timers(kbdev);
					mutex_unlock(&kctx->jctx.sched_info.ctx.jsctx_mutex);
					mutex_unlock(&js_devdata->queue_mutex);
					up(&js_devdata->schedule_sem);
					KBASE_TLSTREAM_TL_JS_SCHED_END(kbdev, 0);
					return;
				}
				kbase_ctx_flag_set(kctx, KCTX_ACTIVE);
			}

			if (!kbase_js_use_ctx(kbdev, kctx, js)) {
				mutex_lock(&kctx->jctx.sched_info.ctx.jsctx_mutex);

				dev_dbg(kbdev->dev,
					"kctx %pK cannot be used at this time\n",
					kctx);

				spin_lock_irqsave(&kbdev->hwaccess_lock, flags);
				if (kbase_js_ctx_pullable(kctx, js, false) ||
				    kbase_ctx_flag(kctx, KCTX_PRIVILEGED))
					timer_sync |=
						kbase_js_ctx_list_add_pullable_head_nolock(
							kctx->kbdev, kctx, js);
				else
					timer_sync |=
						kbase_js_ctx_list_add_unpullable_nolock(
							kctx->kbdev, kctx, js);
				spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
				mutex_unlock(&kctx->jctx.sched_info.ctx.jsctx_mutex);
				if (context_idle) {
					WARN_ON(!kbase_ctx_flag(kctx, KCTX_ACTIVE));
					kbase_ctx_flag_clear(kctx, KCTX_ACTIVE);
					kbase_pm_context_idle(kbdev);
				}

				/* No more jobs can be submitted on this slot */
				js_mask &= ~(1 << js);
				break;
			}
			mutex_lock(&kctx->jctx.sched_info.ctx.jsctx_mutex);
			spin_lock_irqsave(&kbdev->hwaccess_lock, flags);

			kbase_ctx_flag_clear(kctx, KCTX_PULLED);
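			/* KCTX_PULLED is cleared before kicking the slot: if
			 * the kick pulls no atom from this context, the flag
			 * stays clear and the context is requeued below.
			 */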

			if (!kbase_jm_kick(kbdev, 1 << js)) {
				dev_dbg(kbdev->dev, "No more jobs can be submitted (s:%u)\n", js);
				js_mask &= ~(1 << js);
			}
			if (!kbase_ctx_flag(kctx, KCTX_PULLED)) {
				bool pullable;

				dev_dbg(kbdev->dev, "No atoms pulled from kctx %pK (s:%u)\n",
					(void *)kctx, js);

				pullable = kbase_js_ctx_pullable(kctx, js, true);

				/* Failed to pull jobs - push to head of list.
				 * Unless this context is already 'active', in
				 * which case it's effectively already scheduled
				 * so push it to the back of the list.
				 */
				if (pullable && kctx == last_active[js] &&
				    kbase_ctx_flag(kctx,
						   (KCTX_PULLED_SINCE_ACTIVE_JS0 << js)))
					timer_sync |=
						kbase_js_ctx_list_add_pullable_nolock(
							kctx->kbdev, kctx, js);
				else if (pullable)
					timer_sync |=
						kbase_js_ctx_list_add_pullable_head_nolock(
							kctx->kbdev, kctx, js);
				else
					timer_sync |=
						kbase_js_ctx_list_add_unpullable_nolock(
							kctx->kbdev, kctx, js);

				/* If this context is not the active context,
				 * but the active context is pullable on this
				 * slot, then we need to remove the active
				 * marker to prevent it from submitting atoms in
				 * the IRQ handler, which would prevent this
				 * context from making progress.
				 */
				if (last_active[js] && kctx != last_active[js] &&
				    kbase_js_ctx_pullable(last_active[js], js, true))
					ctx_waiting[js] = true;

				if (context_idle) {
					kbase_jm_idle_ctx(kbdev, kctx);
					spin_unlock_irqrestore(&kbdev->hwaccess_lock,
							       flags);
					WARN_ON(!kbase_ctx_flag(kctx, KCTX_ACTIVE));
					kbase_ctx_flag_clear(kctx, KCTX_ACTIVE);
					kbase_pm_context_idle(kbdev);
				} else {
					spin_unlock_irqrestore(&kbdev->hwaccess_lock,
							       flags);
				}
				mutex_unlock(&kctx->jctx.sched_info.ctx.jsctx_mutex);

				js_mask &= ~(1 << js);
				break; /* Could not run atoms on this slot */
			}

			dev_dbg(kbdev->dev, "Push kctx %pK to back of list\n",
				(void *)kctx);
			if (kbase_js_ctx_pullable(kctx, js, true))
				timer_sync |=
					kbase_js_ctx_list_add_pullable_nolock(
						kctx->kbdev, kctx, js);
			else
				timer_sync |=
					kbase_js_ctx_list_add_unpullable_nolock(
						kctx->kbdev, kctx, js);

			spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
			mutex_unlock(&kctx->jctx.sched_info.ctx.jsctx_mutex);
		}
	}

	if (timer_sync)
		kbase_js_sync_timers(kbdev);

	for (js = 0; js < BASE_JM_MAX_NR_SLOTS; js++) {
		if (kbdev->hwaccess.active_kctx[js] == last_active[js] &&
		    ctx_waiting[js]) {
			dev_dbg(kbdev->dev, "Marking kctx %pK as inactive (s:%u)\n",
				(void *)last_active[js], js);
			kbdev->hwaccess.active_kctx[js] = NULL;
		}
	}

	mutex_unlock(&js_devdata->queue_mutex);
	up(&js_devdata->schedule_sem);
	KBASE_TLSTREAM_TL_JS_SCHED_END(kbdev, 0);
}

void kbase_js_zap_context(struct kbase_context *kctx)
{
	struct kbase_device *kbdev = kctx->kbdev;
	struct kbasep_js_device_data *js_devdata = &kbdev->js_data;
	struct kbasep_js_kctx_info *js_kctx_info = &kctx->jctx.sched_info;

	/*
	 * Critical assumption: No more submission is possible outside of the
	 * workqueue. This is because the OS *must* prevent U/K calls (IOCTLs)
	 * whilst the struct kbase_context is terminating.
	 */

	/* First, atomically do the following:
	 * - mark the context as dying
	 * - try to evict it from the queue
	 */
	mutex_lock(&kctx->jctx.lock);
	mutex_lock(&js_devdata->queue_mutex);
	mutex_lock(&js_kctx_info->ctx.jsctx_mutex);
	kbase_ctx_flag_set(kctx, KCTX_DYING);

	dev_dbg(kbdev->dev, "Zap: Try Evict Ctx %pK", kctx);

	/*
	 * At this point we know:
	 * - If eviction succeeded, it was in the queue, but now no longer is
	 *   - We must cancel the jobs here. No Power Manager active reference
	 *     to release.
	 *   - This happens asynchronously - kbase_jd_zap_context() will wait
	 *     for those jobs to be killed.
	 * - If eviction failed, then it wasn't in the queue. It is one of the
	 *   following:
	 *   - a. it didn't have any jobs, and so is not in the Queue or the
	 *     Run Pool (not scheduled)
	 *     - Hence, no more work required to cancel jobs. No Power Manager
	 *       active reference to release.
	 *   - b. it was in the middle of a scheduling transaction (and thus
	 *     must have at least 1 job). This can happen from a syscall or a
	 *     kernel thread. We still hold the jsctx_mutex, and so the thread
	 *     must be waiting inside kbasep_js_try_schedule_head_ctx(),
	 *     before checking whether the runpool is full. That thread will
	 *     continue after we drop the mutex, and will notice the context
	 *     is dying. It will rollback the transaction, killing all jobs at
	 *     the same time. kbase_jd_zap_context() will wait for those jobs
	 *     to be killed.
	 *     - Hence, no more work required to cancel jobs, or to release
	 *       the Power Manager active reference.
	 *   - c. it is scheduled, and may or may not be running jobs
	 *     - We must cause it to leave the runpool by stopping it from
	 *       submitting any more jobs. When it finally does leave,
	 *       kbasep_js_runpool_requeue_or_kill_ctx() will kill all
	 *       remaining jobs (because it is dying), release the Power
	 *       Manager active reference, and will not requeue the context
	 *       in the queue. kbase_jd_zap_context() will wait for those
	 *       jobs to be killed.
	 *     - Hence, work required just to make it leave the runpool.
	 *       Cancelling jobs and releasing the Power Manager active
	 *       reference will be handled when it leaves the runpool.
	 */
	if (!kbase_ctx_flag(kctx, KCTX_SCHEDULED)) {
		unsigned long flags;
		unsigned int js;

		spin_lock_irqsave(&kbdev->hwaccess_lock, flags);
		for (js = 0; js < kbdev->gpu_props.num_job_slots; js++) {
			if (!list_empty(
				&kctx->jctx.sched_info.ctx.ctx_list_entry[js]))
				list_del_init(
					&kctx->jctx.sched_info.ctx.ctx_list_entry[js]);
		}
		spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);

		/* The following events require us to kill off remaining jobs
		 * and update PM book-keeping:
		 * - we evicted it correctly (it must have jobs to be in the
		 *   Queue)
		 *
		 * These events need no action, but take this path anyway:
		 * - Case a: it didn't have any jobs, and was never in the Queue
		 * - Case b: scheduling transaction will be partially rolled-
		 *   back (this already cancels the jobs)
		 */

		KBASE_KTRACE_ADD_JM(kbdev, JM_ZAP_NON_SCHEDULED, kctx, NULL, 0u,
				    kbase_ctx_flag(kctx, KCTX_SCHEDULED));

		dev_dbg(kbdev->dev, "Zap: Ctx %pK scheduled=0", kctx);

		/* Only cancel jobs when we evicted from the
		 * queue. No Power Manager active reference was held.
		 *
		 * Having is_dying set ensures that this kills, and doesn't
		 * requeue.
		 */
		kbasep_js_runpool_requeue_or_kill_ctx(kbdev, kctx, false);

		mutex_unlock(&js_kctx_info->ctx.jsctx_mutex);
		mutex_unlock(&js_devdata->queue_mutex);
		mutex_unlock(&kctx->jctx.lock);
	} else {
		unsigned long flags;
		bool was_retained;
		CSTD_UNUSED(was_retained);

		/* Case c: didn't evict, but it is scheduled - it's in the Run
		 * Pool.
		 */
		KBASE_KTRACE_ADD_JM(kbdev, JM_ZAP_SCHEDULED, kctx, NULL, 0u,
				    kbase_ctx_flag(kctx, KCTX_SCHEDULED));
		dev_dbg(kbdev->dev, "Zap: Ctx %pK is in RunPool", kctx);

		/* Disable the ctx from submitting any more jobs */
		spin_lock_irqsave(&kbdev->hwaccess_lock, flags);

		kbasep_js_clear_submit_allowed(js_devdata, kctx);

		/* Retain and (later) release the context whilst it is now
		 * disallowed from submitting jobs - ensures that someone
		 * somewhere will be removing the context later on.
		 */
		was_retained = kbase_ctx_sched_inc_refcount_nolock(kctx);

		/* Since it's scheduled and we have the jsctx_mutex, it must be
		 * retained successfully.
		 */
		KBASE_DEBUG_ASSERT(was_retained);

		dev_dbg(kbdev->dev, "Zap: Ctx %pK Kill Any Running jobs", kctx);

		/* Cancel any remaining running jobs for this kctx - if any.
		 * Submit is disallowed which takes effect immediately, so no
		 * more new jobs will appear after we do this.
		 */
		kbase_backend_jm_kill_running_jobs_from_kctx(kctx);

		spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
		mutex_unlock(&js_kctx_info->ctx.jsctx_mutex);
		mutex_unlock(&js_devdata->queue_mutex);
		mutex_unlock(&kctx->jctx.lock);

		dev_dbg(kbdev->dev, "Zap: Ctx %pK Release (may or may not schedule out immediately)",
			kctx);

		kbasep_js_runpool_release_ctx(kbdev, kctx);
	}

	KBASE_KTRACE_ADD_JM(kbdev, JM_ZAP_DONE, kctx, NULL, 0u, 0u);

	/* After this, you must wait on both the
	 * kbase_jd_context::zero_jobs_wait and the
	 * kbasep_js_kctx_info::ctx::is_scheduled_waitq - to wait for the jobs
	 * to be destroyed, and the context to be de-scheduled (if it was on
	 * the runpool).
	 *
	 * kbase_jd_zap_context() will do this.
	 */
}

static inline int trace_get_refcnt(struct kbase_device *kbdev,
				   struct kbase_context *kctx)
{
	return atomic_read(&kctx->refcount);
}

/**
 * kbase_js_foreach_ctx_job() - Call a function on all jobs in context
 * @kctx: Pointer to context.
 * @callback: Pointer to function to call for each job.
 *
 * Call a function on all jobs belonging to a non-queued, non-running
 * context, and detach the jobs from the context as it goes.
 *
 * Due to the locks that might be held at the time of the call, the callback
 * may need to defer work on a workqueue to complete its actions (e.g. when
 * cancelling jobs).
 *
 * Atoms will be removed from the queue, so this must only be called when
 * cancelling jobs (which occurs as part of context destruction).
 *
 * The locking conditions on the caller are as follows:
 * - it will be holding kbasep_js_kctx_info::ctx::jsctx_mutex.
 */
static void kbase_js_foreach_ctx_job(struct kbase_context *kctx,
				     kbasep_js_ctx_job_cb *callback)
{
	struct kbase_device *kbdev;
	unsigned long flags;
	unsigned int js;

	kbdev = kctx->kbdev;

	spin_lock_irqsave(&kbdev->hwaccess_lock, flags);

	KBASE_KTRACE_ADD_JM_REFCOUNT(kbdev, JS_POLICY_FOREACH_CTX_JOBS, kctx, NULL,
				     0u, trace_get_refcnt(kbdev, kctx));

	/* Invoke callback on jobs on each slot in turn */
	for (js = 0; js < kbdev->gpu_props.num_job_slots; js++)
		jsctx_queue_foreach(kctx, js, callback);

	spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
}

base_jd_prio kbase_js_priority_check(struct kbase_device *kbdev, base_jd_prio priority)
{
	struct priority_control_manager_device *pcm_device = kbdev->pcm_dev;
	int req_priority, out_priority;

	req_priority = kbasep_js_atom_prio_to_sched_prio(priority);
	out_priority = req_priority;
	/* Skip the PCM priority check if no PCM device is registered or if
	 * kbasep_js_atom_prio_to_sched_prio() returned an error
	 * (KBASE_JS_ATOM_SCHED_PRIO_INVALID).
	 */
	if (pcm_device && (req_priority != KBASE_JS_ATOM_SCHED_PRIO_INVALID))
		out_priority = pcm_device->ops.pcm_scheduler_priority_check(pcm_device, current,
									    req_priority);
	return kbasep_js_sched_prio_to_atom_prio(kbdev, out_priority);
}
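
/*
 * Illustrative sketch (not part of this driver): a priority control manager
 * could clamp the requested scheduling priority before it is applied. The
 * callback shape below matches the pcm_scheduler_priority_check() call above;
 * the policy and function name are hypothetical.
 *
 *	static int example_pcm_priority_check(
 *		struct priority_control_manager_device *dev,
 *		struct task_struct *task, int req_priority)
 *	{
 *		// Hypothetical policy: only capable tasks get realtime.
 *		if (req_priority == KBASE_JS_ATOM_SCHED_PRIO_REALTIME &&
 *		    !has_capability(task, CAP_SYS_NICE))
 *			return KBASE_JS_ATOM_SCHED_PRIO_HIGH;
 *		return req_priority;
 *	}
 */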