]>
Commit | Line | Data |
---|---|---|
fab97220 HS |
1 | /* |
2 | * IBM eServer eHCA Infiniband device driver for Linux on POWER | |
3 | * | |
4 | * Functions for EQs, NEQs and interrupts | |
5 | * | |
6 | * Authors: Heiko J Schick <schickhj@de.ibm.com> | |
7 | * Khadija Souissi <souissi@de.ibm.com> | |
8 | * | |
9 | * Copyright (c) 2005 IBM Corporation | |
10 | * | |
11 | * All rights reserved. | |
12 | * | |
13 | * This source code is distributed under a dual license of GPL v2.0 and OpenIB | |
14 | * BSD. | |
15 | * | |
16 | * OpenIB BSD License | |
17 | * | |
18 | * Redistribution and use in source and binary forms, with or without | |
19 | * modification, are permitted provided that the following conditions are met: | |
20 | * | |
21 | * Redistributions of source code must retain the above copyright notice, this | |
22 | * list of conditions and the following disclaimer. | |
23 | * | |
24 | * Redistributions in binary form must reproduce the above copyright notice, | |
25 | * this list of conditions and the following disclaimer in the documentation | |
26 | * and/or other materials | |
27 | * provided with the distribution. | |
28 | * | |
29 | * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | |
30 | * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | |
31 | * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | |
32 | * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE | |
33 | * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | |
34 | * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | |
35 | * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR | |
36 | * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER | |
37 | * IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | |
38 | * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | |
39 | * POSSIBILITY OF SUCH DAMAGE. | |
40 | */ | |
41 | ||
42 | #include "ehca_classes.h" | |
43 | #include "ehca_irq.h" | |
44 | #include "ehca_iverbs.h" | |
45 | #include "ehca_tools.h" | |
46 | #include "hcp_if.h" | |
47 | #include "hipz_fns.h" | |
7e28db5d | 48 | #include "ipz_pt_fn.h" |
fab97220 HS |
49 | |
50 | #define EQE_COMPLETION_EVENT EHCA_BMASK_IBM(1,1) | |
51 | #define EQE_CQ_QP_NUMBER EHCA_BMASK_IBM(8,31) | |
52 | #define EQE_EE_IDENTIFIER EHCA_BMASK_IBM(2,7) | |
53 | #define EQE_CQ_NUMBER EHCA_BMASK_IBM(8,31) | |
54 | #define EQE_QP_NUMBER EHCA_BMASK_IBM(8,31) | |
55 | #define EQE_QP_TOKEN EHCA_BMASK_IBM(32,63) | |
56 | #define EQE_CQ_TOKEN EHCA_BMASK_IBM(32,63) | |
57 | ||
58 | #define NEQE_COMPLETION_EVENT EHCA_BMASK_IBM(1,1) | |
59 | #define NEQE_EVENT_CODE EHCA_BMASK_IBM(2,7) | |
60 | #define NEQE_PORT_NUMBER EHCA_BMASK_IBM(8,15) | |
61 | #define NEQE_PORT_AVAILABILITY EHCA_BMASK_IBM(16,16) | |
62 | ||
63 | #define ERROR_DATA_LENGTH EHCA_BMASK_IBM(52,63) | |
64 | #define ERROR_DATA_TYPE EHCA_BMASK_IBM(0,7) | |
65 | ||
66 | #ifdef CONFIG_INFINIBAND_EHCA_SCALING | |
67 | ||
68 | static void queue_comp_task(struct ehca_cq *__cq); | |
69 | ||
70 | static struct ehca_comp_pool* pool; | |
71 | static struct notifier_block comp_pool_callback_nb; | |
72 | ||
73 | #endif | |
74 | ||
75 | static inline void comp_event_callback(struct ehca_cq *cq) | |
76 | { | |
77 | if (!cq->ib_cq.comp_handler) | |
78 | return; | |
79 | ||
80 | spin_lock(&cq->cb_lock); | |
81 | cq->ib_cq.comp_handler(&cq->ib_cq, cq->ib_cq.cq_context); | |
82 | spin_unlock(&cq->cb_lock); | |
83 | ||
84 | return; | |
85 | } | |
86 | ||
87 | static void print_error_data(struct ehca_shca * shca, void* data, | |
88 | u64* rblock, int length) | |
89 | { | |
90 | u64 type = EHCA_BMASK_GET(ERROR_DATA_TYPE, rblock[2]); | |
91 | u64 resource = rblock[1]; | |
92 | ||
93 | switch (type) { | |
94 | case 0x1: /* Queue Pair */ | |
95 | { | |
96 | struct ehca_qp *qp = (struct ehca_qp*)data; | |
97 | ||
98 | /* only print error data if AER is set */ | |
99 | if (rblock[6] == 0) | |
100 | return; | |
101 | ||
102 | ehca_err(&shca->ib_device, | |
103 | "QP 0x%x (resource=%lx) has errors.", | |
104 | qp->ib_qp.qp_num, resource); | |
105 | break; | |
106 | } | |
107 | case 0x4: /* Completion Queue */ | |
108 | { | |
109 | struct ehca_cq *cq = (struct ehca_cq*)data; | |
110 | ||
111 | ehca_err(&shca->ib_device, | |
112 | "CQ 0x%x (resource=%lx) has errors.", | |
113 | cq->cq_number, resource); | |
114 | break; | |
115 | } | |
116 | default: | |
117 | ehca_err(&shca->ib_device, | |
118 | "Unknown errror type: %lx on %s.", | |
119 | type, shca->ib_device.name); | |
120 | break; | |
121 | } | |
122 | ||
123 | ehca_err(&shca->ib_device, "Error data is available: %lx.", resource); | |
124 | ehca_err(&shca->ib_device, "EHCA ----- error data begin " | |
125 | "---------------------------------------------------"); | |
126 | ehca_dmp(rblock, length, "resource=%lx", resource); | |
127 | ehca_err(&shca->ib_device, "EHCA ----- error data end " | |
128 | "----------------------------------------------------"); | |
129 | ||
130 | return; | |
131 | } | |
132 | ||
133 | int ehca_error_data(struct ehca_shca *shca, void *data, | |
134 | u64 resource) | |
135 | { | |
136 | ||
137 | unsigned long ret; | |
138 | u64 *rblock; | |
139 | unsigned long block_count; | |
140 | ||
7e28db5d | 141 | rblock = ehca_alloc_fw_ctrlblock(); |
fab97220 HS |
142 | if (!rblock) { |
143 | ehca_err(&shca->ib_device, "Cannot allocate rblock memory."); | |
144 | ret = -ENOMEM; | |
145 | goto error_data1; | |
146 | } | |
147 | ||
7e28db5d | 148 | /* rblock must be 4K aligned and should be 4K large */ |
fab97220 HS |
149 | ret = hipz_h_error_data(shca->ipz_hca_handle, |
150 | resource, | |
151 | rblock, | |
152 | &block_count); | |
153 | ||
7e28db5d | 154 | if (ret == H_R_STATE) |
fab97220 HS |
155 | ehca_err(&shca->ib_device, |
156 | "No error data is available: %lx.", resource); | |
fab97220 HS |
157 | else if (ret == H_SUCCESS) { |
158 | int length; | |
159 | ||
160 | length = EHCA_BMASK_GET(ERROR_DATA_LENGTH, rblock[0]); | |
161 | ||
7e28db5d HNN |
162 | if (length > EHCA_PAGESIZE) |
163 | length = EHCA_PAGESIZE; | |
fab97220 HS |
164 | |
165 | print_error_data(shca, data, rblock, length); | |
7e28db5d | 166 | } else |
fab97220 HS |
167 | ehca_err(&shca->ib_device, |
168 | "Error data could not be fetched: %lx", resource); | |
fab97220 | 169 | |
7e28db5d | 170 | ehca_free_fw_ctrlblock(rblock); |
fab97220 HS |
171 | |
172 | error_data1: | |
173 | return ret; | |
174 | ||
175 | } | |
176 | ||
177 | static void qp_event_callback(struct ehca_shca *shca, | |
178 | u64 eqe, | |
179 | enum ib_event_type event_type) | |
180 | { | |
181 | struct ib_event event; | |
182 | struct ehca_qp *qp; | |
183 | unsigned long flags; | |
184 | u32 token = EHCA_BMASK_GET(EQE_QP_TOKEN, eqe); | |
185 | ||
186 | spin_lock_irqsave(&ehca_qp_idr_lock, flags); | |
187 | qp = idr_find(&ehca_qp_idr, token); | |
188 | spin_unlock_irqrestore(&ehca_qp_idr_lock, flags); | |
189 | ||
190 | ||
191 | if (!qp) | |
192 | return; | |
193 | ||
194 | ehca_error_data(shca, qp, qp->ipz_qp_handle.handle); | |
195 | ||
196 | if (!qp->ib_qp.event_handler) | |
197 | return; | |
198 | ||
199 | event.device = &shca->ib_device; | |
200 | event.event = event_type; | |
201 | event.element.qp = &qp->ib_qp; | |
202 | ||
203 | qp->ib_qp.event_handler(&event, qp->ib_qp.qp_context); | |
204 | ||
205 | return; | |
206 | } | |
207 | ||
208 | static void cq_event_callback(struct ehca_shca *shca, | |
209 | u64 eqe) | |
210 | { | |
211 | struct ehca_cq *cq; | |
212 | unsigned long flags; | |
213 | u32 token = EHCA_BMASK_GET(EQE_CQ_TOKEN, eqe); | |
214 | ||
215 | spin_lock_irqsave(&ehca_cq_idr_lock, flags); | |
216 | cq = idr_find(&ehca_cq_idr, token); | |
217 | spin_unlock_irqrestore(&ehca_cq_idr_lock, flags); | |
218 | ||
219 | if (!cq) | |
220 | return; | |
221 | ||
222 | ehca_error_data(shca, cq, cq->ipz_cq_handle.handle); | |
223 | ||
224 | return; | |
225 | } | |
226 | ||
227 | static void parse_identifier(struct ehca_shca *shca, u64 eqe) | |
228 | { | |
229 | u8 identifier = EHCA_BMASK_GET(EQE_EE_IDENTIFIER, eqe); | |
230 | ||
231 | switch (identifier) { | |
232 | case 0x02: /* path migrated */ | |
233 | qp_event_callback(shca, eqe, IB_EVENT_PATH_MIG); | |
234 | break; | |
235 | case 0x03: /* communication established */ | |
236 | qp_event_callback(shca, eqe, IB_EVENT_COMM_EST); | |
237 | break; | |
238 | case 0x04: /* send queue drained */ | |
239 | qp_event_callback(shca, eqe, IB_EVENT_SQ_DRAINED); | |
240 | break; | |
241 | case 0x05: /* QP error */ | |
242 | case 0x06: /* QP error */ | |
243 | qp_event_callback(shca, eqe, IB_EVENT_QP_FATAL); | |
244 | break; | |
245 | case 0x07: /* CQ error */ | |
246 | case 0x08: /* CQ error */ | |
247 | cq_event_callback(shca, eqe); | |
248 | break; | |
249 | case 0x09: /* MRMWPTE error */ | |
250 | ehca_err(&shca->ib_device, "MRMWPTE error."); | |
251 | break; | |
252 | case 0x0A: /* port event */ | |
253 | ehca_err(&shca->ib_device, "Port event."); | |
254 | break; | |
255 | case 0x0B: /* MR access error */ | |
256 | ehca_err(&shca->ib_device, "MR access error."); | |
257 | break; | |
258 | case 0x0C: /* EQ error */ | |
259 | ehca_err(&shca->ib_device, "EQ error."); | |
260 | break; | |
261 | case 0x0D: /* P/Q_Key mismatch */ | |
262 | ehca_err(&shca->ib_device, "P/Q_Key mismatch."); | |
263 | break; | |
264 | case 0x10: /* sampling complete */ | |
265 | ehca_err(&shca->ib_device, "Sampling complete."); | |
266 | break; | |
267 | case 0x11: /* unaffiliated access error */ | |
268 | ehca_err(&shca->ib_device, "Unaffiliated access error."); | |
269 | break; | |
270 | case 0x12: /* path migrating error */ | |
271 | ehca_err(&shca->ib_device, "Path migration error."); | |
272 | break; | |
273 | case 0x13: /* interface trace stopped */ | |
274 | ehca_err(&shca->ib_device, "Interface trace stopped."); | |
275 | break; | |
276 | case 0x14: /* first error capture info available */ | |
277 | default: | |
278 | ehca_err(&shca->ib_device, "Unknown identifier: %x on %s.", | |
279 | identifier, shca->ib_device.name); | |
280 | break; | |
281 | } | |
282 | ||
283 | return; | |
284 | } | |
285 | ||
286 | static void parse_ec(struct ehca_shca *shca, u64 eqe) | |
287 | { | |
288 | struct ib_event event; | |
289 | u8 ec = EHCA_BMASK_GET(NEQE_EVENT_CODE, eqe); | |
290 | u8 port = EHCA_BMASK_GET(NEQE_PORT_NUMBER, eqe); | |
291 | ||
292 | switch (ec) { | |
293 | case 0x30: /* port availability change */ | |
294 | if (EHCA_BMASK_GET(NEQE_PORT_AVAILABILITY, eqe)) { | |
295 | ehca_info(&shca->ib_device, | |
296 | "port %x is active.", port); | |
297 | event.device = &shca->ib_device; | |
298 | event.event = IB_EVENT_PORT_ACTIVE; | |
299 | event.element.port_num = port; | |
300 | shca->sport[port - 1].port_state = IB_PORT_ACTIVE; | |
301 | ib_dispatch_event(&event); | |
302 | } else { | |
303 | ehca_info(&shca->ib_device, | |
304 | "port %x is inactive.", port); | |
305 | event.device = &shca->ib_device; | |
306 | event.event = IB_EVENT_PORT_ERR; | |
307 | event.element.port_num = port; | |
308 | shca->sport[port - 1].port_state = IB_PORT_DOWN; | |
309 | ib_dispatch_event(&event); | |
310 | } | |
311 | break; | |
312 | case 0x31: | |
313 | /* port configuration change | |
314 | * disruptive change is caused by | |
315 | * LID, PKEY or SM change | |
316 | */ | |
317 | ehca_warn(&shca->ib_device, | |
318 | "disruptive port %x configuration change", port); | |
319 | ||
320 | ehca_info(&shca->ib_device, | |
321 | "port %x is inactive.", port); | |
322 | event.device = &shca->ib_device; | |
323 | event.event = IB_EVENT_PORT_ERR; | |
324 | event.element.port_num = port; | |
325 | shca->sport[port - 1].port_state = IB_PORT_DOWN; | |
326 | ib_dispatch_event(&event); | |
327 | ||
328 | ehca_info(&shca->ib_device, | |
329 | "port %x is active.", port); | |
330 | event.device = &shca->ib_device; | |
331 | event.event = IB_EVENT_PORT_ACTIVE; | |
332 | event.element.port_num = port; | |
333 | shca->sport[port - 1].port_state = IB_PORT_ACTIVE; | |
334 | ib_dispatch_event(&event); | |
335 | break; | |
336 | case 0x32: /* adapter malfunction */ | |
337 | ehca_err(&shca->ib_device, "Adapter malfunction."); | |
338 | break; | |
339 | case 0x33: /* trace stopped */ | |
340 | ehca_err(&shca->ib_device, "Traced stopped."); | |
341 | break; | |
342 | default: | |
343 | ehca_err(&shca->ib_device, "Unknown event code: %x on %s.", | |
344 | ec, shca->ib_device.name); | |
345 | break; | |
346 | } | |
347 | ||
348 | return; | |
349 | } | |
350 | ||
351 | static inline void reset_eq_pending(struct ehca_cq *cq) | |
352 | { | |
353 | u64 CQx_EP; | |
354 | struct h_galpa gal = cq->galpas.kernel; | |
355 | ||
356 | hipz_galpa_store_cq(gal, cqx_ep, 0x0); | |
357 | CQx_EP = hipz_galpa_load(gal, CQTEMM_OFFSET(cqx_ep)); | |
358 | ||
359 | return; | |
360 | } | |
361 | ||
7d12e780 | 362 | irqreturn_t ehca_interrupt_neq(int irq, void *dev_id) |
fab97220 HS |
363 | { |
364 | struct ehca_shca *shca = (struct ehca_shca*)dev_id; | |
365 | ||
366 | tasklet_hi_schedule(&shca->neq.interrupt_task); | |
367 | ||
368 | return IRQ_HANDLED; | |
369 | } | |
370 | ||
371 | void ehca_tasklet_neq(unsigned long data) | |
372 | { | |
373 | struct ehca_shca *shca = (struct ehca_shca*)data; | |
374 | struct ehca_eqe *eqe; | |
375 | u64 ret; | |
376 | ||
377 | eqe = (struct ehca_eqe *)ehca_poll_eq(shca, &shca->neq); | |
378 | ||
379 | while (eqe) { | |
380 | if (!EHCA_BMASK_GET(NEQE_COMPLETION_EVENT, eqe->entry)) | |
381 | parse_ec(shca, eqe->entry); | |
382 | ||
383 | eqe = (struct ehca_eqe *)ehca_poll_eq(shca, &shca->neq); | |
384 | } | |
385 | ||
386 | ret = hipz_h_reset_event(shca->ipz_hca_handle, | |
387 | shca->neq.ipz_eq_handle, 0xFFFFFFFFFFFFFFFFL); | |
388 | ||
389 | if (ret != H_SUCCESS) | |
390 | ehca_err(&shca->ib_device, "Can't clear notification events."); | |
391 | ||
392 | return; | |
393 | } | |
394 | ||
7d12e780 | 395 | irqreturn_t ehca_interrupt_eq(int irq, void *dev_id) |
fab97220 HS |
396 | { |
397 | struct ehca_shca *shca = (struct ehca_shca*)dev_id; | |
398 | ||
399 | tasklet_hi_schedule(&shca->eq.interrupt_task); | |
400 | ||
401 | return IRQ_HANDLED; | |
402 | } | |
403 | ||
404 | void ehca_tasklet_eq(unsigned long data) | |
405 | { | |
406 | struct ehca_shca *shca = (struct ehca_shca*)data; | |
407 | struct ehca_eqe *eqe; | |
408 | int int_state; | |
409 | int query_cnt = 0; | |
410 | ||
411 | do { | |
412 | eqe = (struct ehca_eqe *)ehca_poll_eq(shca, &shca->eq); | |
413 | ||
414 | if ((shca->hw_level >= 2) && eqe) | |
415 | int_state = 1; | |
416 | else | |
417 | int_state = 0; | |
418 | ||
419 | while ((int_state == 1) || eqe) { | |
420 | while (eqe) { | |
421 | u64 eqe_value = eqe->entry; | |
422 | ||
423 | ehca_dbg(&shca->ib_device, | |
424 | "eqe_value=%lx", eqe_value); | |
425 | ||
426 | /* TODO: better structure */ | |
427 | if (EHCA_BMASK_GET(EQE_COMPLETION_EVENT, | |
428 | eqe_value)) { | |
429 | unsigned long flags; | |
430 | u32 token; | |
431 | struct ehca_cq *cq; | |
432 | ||
433 | ehca_dbg(&shca->ib_device, | |
434 | "... completion event"); | |
435 | token = | |
436 | EHCA_BMASK_GET(EQE_CQ_TOKEN, | |
437 | eqe_value); | |
438 | spin_lock_irqsave(&ehca_cq_idr_lock, | |
439 | flags); | |
440 | cq = idr_find(&ehca_cq_idr, token); | |
441 | ||
442 | if (cq == NULL) { | |
443 | spin_unlock(&ehca_cq_idr_lock); | |
444 | break; | |
445 | } | |
446 | ||
447 | reset_eq_pending(cq); | |
448 | #ifdef CONFIG_INFINIBAND_EHCA_SCALING | |
449 | queue_comp_task(cq); | |
450 | spin_unlock_irqrestore(&ehca_cq_idr_lock, | |
451 | flags); | |
452 | #else | |
453 | spin_unlock_irqrestore(&ehca_cq_idr_lock, | |
454 | flags); | |
455 | comp_event_callback(cq); | |
456 | #endif | |
457 | } else { | |
458 | ehca_dbg(&shca->ib_device, | |
459 | "... non completion event"); | |
460 | parse_identifier(shca, eqe_value); | |
461 | } | |
462 | eqe = | |
463 | (struct ehca_eqe *)ehca_poll_eq(shca, | |
464 | &shca->eq); | |
465 | } | |
466 | ||
467 | if (shca->hw_level >= 2) { | |
468 | int_state = | |
469 | hipz_h_query_int_state(shca->ipz_hca_handle, | |
470 | shca->eq.ist); | |
471 | query_cnt++; | |
472 | iosync(); | |
473 | if (query_cnt >= 100) { | |
474 | query_cnt = 0; | |
475 | int_state = 0; | |
476 | } | |
477 | } | |
478 | eqe = (struct ehca_eqe *)ehca_poll_eq(shca, &shca->eq); | |
479 | ||
480 | } | |
481 | } while (int_state != 0); | |
482 | ||
483 | return; | |
484 | } | |
485 | ||
486 | #ifdef CONFIG_INFINIBAND_EHCA_SCALING | |
487 | ||
488 | static inline int find_next_online_cpu(struct ehca_comp_pool* pool) | |
489 | { | |
490 | unsigned long flags_last_cpu; | |
491 | ||
492 | if (ehca_debug_level) | |
493 | ehca_dmp(&cpu_online_map, sizeof(cpumask_t), ""); | |
494 | ||
495 | spin_lock_irqsave(&pool->last_cpu_lock, flags_last_cpu); | |
496 | pool->last_cpu = next_cpu(pool->last_cpu, cpu_online_map); | |
497 | if (pool->last_cpu == NR_CPUS) | |
498 | pool->last_cpu = first_cpu(cpu_online_map); | |
499 | spin_unlock_irqrestore(&pool->last_cpu_lock, flags_last_cpu); | |
500 | ||
501 | return pool->last_cpu; | |
502 | } | |
503 | ||
504 | static void __queue_comp_task(struct ehca_cq *__cq, | |
505 | struct ehca_cpu_comp_task *cct) | |
506 | { | |
507 | unsigned long flags_cct; | |
508 | unsigned long flags_cq; | |
509 | ||
510 | spin_lock_irqsave(&cct->task_lock, flags_cct); | |
511 | spin_lock_irqsave(&__cq->task_lock, flags_cq); | |
512 | ||
513 | if (__cq->nr_callbacks == 0) { | |
514 | __cq->nr_callbacks++; | |
515 | list_add_tail(&__cq->entry, &cct->cq_list); | |
516 | cct->cq_jobs++; | |
517 | wake_up(&cct->wait_queue); | |
518 | } | |
519 | else | |
520 | __cq->nr_callbacks++; | |
521 | ||
522 | spin_unlock_irqrestore(&__cq->task_lock, flags_cq); | |
523 | spin_unlock_irqrestore(&cct->task_lock, flags_cct); | |
524 | } | |
525 | ||
526 | static void queue_comp_task(struct ehca_cq *__cq) | |
527 | { | |
528 | int cpu; | |
529 | int cpu_id; | |
530 | struct ehca_cpu_comp_task *cct; | |
531 | ||
532 | cpu = get_cpu(); | |
533 | cpu_id = find_next_online_cpu(pool); | |
534 | ||
535 | BUG_ON(!cpu_online(cpu_id)); | |
536 | ||
537 | cct = per_cpu_ptr(pool->cpu_comp_tasks, cpu_id); | |
538 | ||
539 | if (cct->cq_jobs > 0) { | |
540 | cpu_id = find_next_online_cpu(pool); | |
541 | cct = per_cpu_ptr(pool->cpu_comp_tasks, cpu_id); | |
542 | } | |
543 | ||
544 | __queue_comp_task(__cq, cct); | |
545 | ||
546 | put_cpu(); | |
547 | ||
548 | return; | |
549 | } | |
550 | ||
551 | static void run_comp_task(struct ehca_cpu_comp_task* cct) | |
552 | { | |
553 | struct ehca_cq *cq; | |
554 | unsigned long flags_cct; | |
555 | unsigned long flags_cq; | |
556 | ||
557 | spin_lock_irqsave(&cct->task_lock, flags_cct); | |
558 | ||
559 | while (!list_empty(&cct->cq_list)) { | |
560 | cq = list_entry(cct->cq_list.next, struct ehca_cq, entry); | |
561 | spin_unlock_irqrestore(&cct->task_lock, flags_cct); | |
562 | comp_event_callback(cq); | |
563 | spin_lock_irqsave(&cct->task_lock, flags_cct); | |
564 | ||
565 | spin_lock_irqsave(&cq->task_lock, flags_cq); | |
566 | cq->nr_callbacks--; | |
567 | if (cq->nr_callbacks == 0) { | |
568 | list_del_init(cct->cq_list.next); | |
569 | cct->cq_jobs--; | |
570 | } | |
571 | spin_unlock_irqrestore(&cq->task_lock, flags_cq); | |
572 | ||
573 | } | |
574 | ||
575 | spin_unlock_irqrestore(&cct->task_lock, flags_cct); | |
576 | ||
577 | return; | |
578 | } | |
579 | ||
580 | static int comp_task(void *__cct) | |
581 | { | |
582 | struct ehca_cpu_comp_task* cct = __cct; | |
583 | DECLARE_WAITQUEUE(wait, current); | |
584 | ||
585 | set_current_state(TASK_INTERRUPTIBLE); | |
586 | while(!kthread_should_stop()) { | |
587 | add_wait_queue(&cct->wait_queue, &wait); | |
588 | ||
589 | if (list_empty(&cct->cq_list)) | |
590 | schedule(); | |
591 | else | |
592 | __set_current_state(TASK_RUNNING); | |
593 | ||
594 | remove_wait_queue(&cct->wait_queue, &wait); | |
595 | ||
596 | if (!list_empty(&cct->cq_list)) | |
597 | run_comp_task(__cct); | |
598 | ||
599 | set_current_state(TASK_INTERRUPTIBLE); | |
600 | } | |
601 | __set_current_state(TASK_RUNNING); | |
602 | ||
603 | return 0; | |
604 | } | |
605 | ||
606 | static struct task_struct *create_comp_task(struct ehca_comp_pool *pool, | |
607 | int cpu) | |
608 | { | |
609 | struct ehca_cpu_comp_task *cct; | |
610 | ||
611 | cct = per_cpu_ptr(pool->cpu_comp_tasks, cpu); | |
612 | spin_lock_init(&cct->task_lock); | |
613 | INIT_LIST_HEAD(&cct->cq_list); | |
614 | init_waitqueue_head(&cct->wait_queue); | |
615 | cct->task = kthread_create(comp_task, cct, "ehca_comp/%d", cpu); | |
616 | ||
617 | return cct->task; | |
618 | } | |
619 | ||
620 | static void destroy_comp_task(struct ehca_comp_pool *pool, | |
621 | int cpu) | |
622 | { | |
623 | struct ehca_cpu_comp_task *cct; | |
624 | struct task_struct *task; | |
625 | unsigned long flags_cct; | |
626 | ||
627 | cct = per_cpu_ptr(pool->cpu_comp_tasks, cpu); | |
628 | ||
629 | spin_lock_irqsave(&cct->task_lock, flags_cct); | |
630 | ||
631 | task = cct->task; | |
632 | cct->task = NULL; | |
633 | cct->cq_jobs = 0; | |
634 | ||
635 | spin_unlock_irqrestore(&cct->task_lock, flags_cct); | |
636 | ||
637 | if (task) | |
638 | kthread_stop(task); | |
639 | ||
640 | return; | |
641 | } | |
642 | ||
643 | static void take_over_work(struct ehca_comp_pool *pool, | |
644 | int cpu) | |
645 | { | |
646 | struct ehca_cpu_comp_task *cct = per_cpu_ptr(pool->cpu_comp_tasks, cpu); | |
647 | LIST_HEAD(list); | |
648 | struct ehca_cq *cq; | |
649 | unsigned long flags_cct; | |
650 | ||
651 | spin_lock_irqsave(&cct->task_lock, flags_cct); | |
652 | ||
653 | list_splice_init(&cct->cq_list, &list); | |
654 | ||
655 | while(!list_empty(&list)) { | |
656 | cq = list_entry(cct->cq_list.next, struct ehca_cq, entry); | |
657 | ||
658 | list_del(&cq->entry); | |
659 | __queue_comp_task(cq, per_cpu_ptr(pool->cpu_comp_tasks, | |
660 | smp_processor_id())); | |
661 | } | |
662 | ||
663 | spin_unlock_irqrestore(&cct->task_lock, flags_cct); | |
664 | ||
665 | } | |
666 | ||
667 | static int comp_pool_callback(struct notifier_block *nfb, | |
668 | unsigned long action, | |
669 | void *hcpu) | |
670 | { | |
671 | unsigned int cpu = (unsigned long)hcpu; | |
672 | struct ehca_cpu_comp_task *cct; | |
673 | ||
674 | switch (action) { | |
675 | case CPU_UP_PREPARE: | |
676 | ehca_gen_dbg("CPU: %x (CPU_PREPARE)", cpu); | |
677 | if(!create_comp_task(pool, cpu)) { | |
678 | ehca_gen_err("Can't create comp_task for cpu: %x", cpu); | |
679 | return NOTIFY_BAD; | |
680 | } | |
681 | break; | |
682 | case CPU_UP_CANCELED: | |
683 | ehca_gen_dbg("CPU: %x (CPU_CANCELED)", cpu); | |
684 | cct = per_cpu_ptr(pool->cpu_comp_tasks, cpu); | |
685 | kthread_bind(cct->task, any_online_cpu(cpu_online_map)); | |
686 | destroy_comp_task(pool, cpu); | |
687 | break; | |
688 | case CPU_ONLINE: | |
689 | ehca_gen_dbg("CPU: %x (CPU_ONLINE)", cpu); | |
690 | cct = per_cpu_ptr(pool->cpu_comp_tasks, cpu); | |
691 | kthread_bind(cct->task, cpu); | |
692 | wake_up_process(cct->task); | |
693 | break; | |
694 | case CPU_DOWN_PREPARE: | |
695 | ehca_gen_dbg("CPU: %x (CPU_DOWN_PREPARE)", cpu); | |
696 | break; | |
697 | case CPU_DOWN_FAILED: | |
698 | ehca_gen_dbg("CPU: %x (CPU_DOWN_FAILED)", cpu); | |
699 | break; | |
700 | case CPU_DEAD: | |
701 | ehca_gen_dbg("CPU: %x (CPU_DEAD)", cpu); | |
702 | destroy_comp_task(pool, cpu); | |
703 | take_over_work(pool, cpu); | |
704 | break; | |
705 | } | |
706 | ||
707 | return NOTIFY_OK; | |
708 | } | |
709 | ||
710 | #endif | |
711 | ||
712 | int ehca_create_comp_pool(void) | |
713 | { | |
714 | #ifdef CONFIG_INFINIBAND_EHCA_SCALING | |
715 | int cpu; | |
716 | struct task_struct *task; | |
717 | ||
718 | pool = kzalloc(sizeof(struct ehca_comp_pool), GFP_KERNEL); | |
719 | if (pool == NULL) | |
720 | return -ENOMEM; | |
721 | ||
722 | spin_lock_init(&pool->last_cpu_lock); | |
723 | pool->last_cpu = any_online_cpu(cpu_online_map); | |
724 | ||
725 | pool->cpu_comp_tasks = alloc_percpu(struct ehca_cpu_comp_task); | |
726 | if (pool->cpu_comp_tasks == NULL) { | |
727 | kfree(pool); | |
728 | return -EINVAL; | |
729 | } | |
730 | ||
731 | for_each_online_cpu(cpu) { | |
732 | task = create_comp_task(pool, cpu); | |
733 | if (task) { | |
734 | kthread_bind(task, cpu); | |
735 | wake_up_process(task); | |
736 | } | |
737 | } | |
738 | ||
739 | comp_pool_callback_nb.notifier_call = comp_pool_callback; | |
740 | comp_pool_callback_nb.priority =0; | |
741 | register_cpu_notifier(&comp_pool_callback_nb); | |
742 | #endif | |
743 | ||
744 | return 0; | |
745 | } | |
746 | ||
747 | void ehca_destroy_comp_pool(void) | |
748 | { | |
749 | #ifdef CONFIG_INFINIBAND_EHCA_SCALING | |
750 | int i; | |
751 | ||
752 | unregister_cpu_notifier(&comp_pool_callback_nb); | |
753 | ||
754 | for (i = 0; i < NR_CPUS; i++) { | |
755 | if (cpu_online(i)) | |
756 | destroy_comp_task(pool, i); | |
757 | } | |
758 | #endif | |
759 | ||
760 | return; | |
761 | } |