block: do not merge requests without consulting with io scheduler

[mirror_ubuntu-artful-kernel.git] / block / cfq-iosched.c
diff --git a/block/cfq-iosched.c b/block/cfq-iosched.c

index 9c2e82c1ea880530b367101cf47ef0fc225eed4d..acabba198de936cd9fc4b2e679947fb526c9c0f1 100644 (file)
--- a/block/cfq-iosched.c
+++ b/block/cfq-iosched.c
@@ -132,7 +132,7 @@ struct cfq_queue {
         /* time when first request from queue completed and slice started. */
         u64 slice_start;
         u64 slice_end;
-       u64 slice_resid;
+       s64 slice_resid;
  
         /* pending priority requests */
         int prio_pending;
@@ -141,7 +141,7 @@ struct cfq_queue {
  
         /* io prio of this group */
         unsigned short ioprio, org_ioprio;
-       unsigned short ioprio_class;
+       unsigned short ioprio_class, org_ioprio_class;
  
         pid_t pid;
  
@@ -362,7 +362,7 @@ struct cfq_data {
         /*
          * idle window management
          */
-       struct timer_list idle_slice_timer;
+       struct hrtimer idle_slice_timer;
         struct work_struct unplug_work;
  
         struct cfq_queue *active_queue;
@@ -1463,7 +1463,8 @@ static inline u64 cfq_cfqq_slice_usage(struct cfq_queue *cfqq,
                  * a single request on seeky media and cause lots of seek time
                  * and group will never know it.
                  */
-               slice_used = max_t(u64, (now - cfqq->dispatch_start), 1);
+               slice_used = max_t(u64, (now - cfqq->dispatch_start),
+                                       jiffies_to_nsecs(1));
         } else {
                 slice_used = now - cfqq->slice_start;
                 if (slice_used > cfqq->allocated_slice) {
@@ -2543,7 +2544,7 @@ static int cfq_merge(struct request_queue *q, struct request **req,
         struct request *__rq;
  
         __rq = cfq_find_rq_fmerge(cfqd, bio);
-       if (__rq && elv_rq_merge_ok(__rq, bio)) {
+       if (__rq && elv_bio_merge_ok(__rq, bio)) {
                 *req = __rq;
                 return ELEVATOR_FRONT_MERGE;
         }
@@ -2600,8 +2601,8 @@ cfq_merged_requests(struct request_queue *q, struct request *rq,
                 cfq_del_cfqq_rr(cfqd, cfqq);
  }
  
-static int cfq_allow_merge(struct request_queue *q, struct request *rq,
-                          struct bio *bio)
+static int cfq_allow_bio_merge(struct request_queue *q, struct request *rq,
+                              struct bio *bio)
  {
         struct cfq_data *cfqd = q->elevator->elevator_data;
         struct cfq_io_cq *cic;
@@ -2625,9 +2626,15 @@ static int cfq_allow_merge(struct request_queue *q, struct request *rq,
         return cfqq == RQ_CFQQ(rq);
  }
  
+static int cfq_allow_rq_merge(struct request_queue *q, struct request *rq,
+                             struct request *next)
+{
+       return RQ_CFQQ(rq) == RQ_CFQQ(next);
+}
+
  static inline void cfq_del_timer(struct cfq_data *cfqd, struct cfq_queue *cfqq)
  {
-       del_timer(&cfqd->idle_slice_timer);
+       hrtimer_try_to_cancel(&cfqd->idle_slice_timer);
         cfqg_stats_update_idle_time(cfqq->cfqg);
  }
  
@@ -2689,7 +2696,7 @@ __cfq_slice_expired(struct cfq_data *cfqd, struct cfq_queue *cfqq,
                         cfqq->slice_resid = cfq_scaled_cfqq_slice(cfqd, cfqq);
                 else
                         cfqq->slice_resid = cfqq->slice_end - ktime_get_ns();
-               cfq_log_cfqq(cfqd, cfqq, "resid=%llu", cfqq->slice_resid);
+               cfq_log_cfqq(cfqd, cfqq, "resid=%lld", cfqq->slice_resid);
         }
  
         cfq_group_served(cfqd, cfqq->cfqg, cfqq);
@@ -2989,7 +2996,8 @@ static void cfq_arm_slice_timer(struct cfq_data *cfqd)
         else
                 sl = cfqd->cfq_slice_idle;
  
-       mod_timer(&cfqd->idle_slice_timer, now + sl);
+       hrtimer_start(&cfqd->idle_slice_timer, ns_to_ktime(sl),
+                     HRTIMER_MODE_REL);
         cfqg_stats_set_start_idle_time(cfqq->cfqg);
         cfq_log_cfqq(cfqd, cfqq, "arm_idle: %llu group_idle: %d", sl,
                         group_idle ? 1 : 0);
@@ -3308,7 +3316,7 @@ static struct cfq_queue *cfq_select_queue(struct cfq_data *cfqd)
          * flight or is idling for a new request, allow either of these
          * conditions to happen (or time out) before selecting a new queue.
          */
-       if (timer_pending(&cfqd->idle_slice_timer)) {
+       if (hrtimer_active(&cfqd->idle_slice_timer)) {
                 cfqq = NULL;
                 goto keep_queue;
         }
@@ -3699,6 +3707,7 @@ static void cfq_init_prio_data(struct cfq_queue *cfqq, struct cfq_io_cq *cic)
          * elevate the priority of this queue
          */
         cfqq->org_ioprio = cfqq->ioprio;
+       cfqq->org_ioprio_class = cfqq->ioprio_class;
         cfq_clear_cfqq_prio_changed(cfqq);
  }
  
@@ -4241,7 +4250,16 @@ static void cfq_completed_request(struct request_queue *q, struct request *rq)
                                         cfqq_type(cfqq));
  
                 st->ttime.last_end_request = now;
-               if (!(rq->start_time + cfqd->cfq_fifo_expire[1] > now))
+               /*
+                * We have to do this check in jiffies since start_time is in
+                * jiffies and it is not trivial to convert to ns. If
+                * cfq_fifo_expire[1] ever comes close to 1 jiffie, this test
+                * will become problematic but so far we are fine (the default
+                * is 128 ms).
+                */
+               if (!time_after(rq->start_time +
+                                 nsecs_to_jiffies(cfqd->cfq_fifo_expire[1]),
+                               jiffies))
                         cfqd->last_delayed_sync = now;
         }
  
@@ -4294,6 +4312,24 @@ static void cfq_completed_request(struct request_queue *q, struct request *rq)
                 cfq_schedule_dispatch(cfqd);
  }
  
+static void cfqq_boost_on_prio(struct cfq_queue *cfqq, int op_flags)
+{
+       /*
+        * If REQ_PRIO is set, boost class and prio level, if it's below
+        * BE/NORM. If prio is not set, restore the potentially boosted
+        * class/prio level.
+        */
+       if (!(op_flags & REQ_PRIO)) {
+               cfqq->ioprio_class = cfqq->org_ioprio_class;
+               cfqq->ioprio = cfqq->org_ioprio;
+       } else {
+               if (cfq_class_idle(cfqq))
+                       cfqq->ioprio_class = IOPRIO_CLASS_BE;
+               if (cfqq->ioprio > IOPRIO_NORM)
+                       cfqq->ioprio = IOPRIO_NORM;
+       }
+}
+
  static inline int __cfq_may_queue(struct cfq_queue *cfqq)
  {
         if (cfq_cfqq_wait_request(cfqq) && !cfq_cfqq_must_alloc_slice(cfqq)) {
@@ -4324,6 +4360,7 @@ static int cfq_may_queue(struct request_queue *q, int op, int op_flags)
         cfqq = cic_to_cfqq(cic, rw_is_sync(op, op_flags));
         if (cfqq) {
                 cfq_init_prio_data(cfqq, cic);
+               cfqq_boost_on_prio(cfqq, op_flags);
  
                 return __cfq_may_queue(cfqq);
         }
@@ -4454,9 +4491,10 @@ static void cfq_kick_queue(struct work_struct *work)
  /*
   * Timer running if the active_queue is currently idling inside its time slice
   */
-static void cfq_idle_slice_timer(unsigned long data)
+static enum hrtimer_restart cfq_idle_slice_timer(struct hrtimer *timer)
  {
-       struct cfq_data *cfqd = (struct cfq_data *) data;
+       struct cfq_data *cfqd = container_of(timer, struct cfq_data,
+                                            idle_slice_timer);
         struct cfq_queue *cfqq;
         unsigned long flags;
         int timed_out = 1;
@@ -4505,11 +4543,12 @@ out_kick:
         cfq_schedule_dispatch(cfqd);
  out_cont:
         spin_unlock_irqrestore(cfqd->queue->queue_lock, flags);
+       return HRTIMER_NORESTART;
  }
  
  static void cfq_shutdown_timer_wq(struct cfq_data *cfqd)
  {
-       del_timer_sync(&cfqd->idle_slice_timer);
+       hrtimer_cancel(&cfqd->idle_slice_timer);
         cancel_work_sync(&cfqd->unplug_work);
  }
  
@@ -4605,9 +4644,9 @@ static int cfq_init_queue(struct request_queue *q, struct elevator_type *e)
         cfqg_put(cfqd->root_group);
         spin_unlock_irq(q->queue_lock);
  
-       init_timer(&cfqd->idle_slice_timer);
+       hrtimer_init(&cfqd->idle_slice_timer, CLOCK_MONOTONIC,
+                    HRTIMER_MODE_REL);
         cfqd->idle_slice_timer.function = cfq_idle_slice_timer;
-       cfqd->idle_slice_timer.data = (unsigned long) cfqd;
  
         INIT_WORK(&cfqd->unplug_work, cfq_kick_queue);
  
@@ -4690,6 +4729,21 @@ SHOW_FUNCTION(cfq_low_latency_show, cfqd->cfq_latency, 0);
  SHOW_FUNCTION(cfq_target_latency_show, cfqd->cfq_target_latency, 1);
  #undef SHOW_FUNCTION
  
+#define USEC_SHOW_FUNCTION(__FUNC, __VAR)                              \
+static ssize_t __FUNC(struct elevator_queue *e, char *page)            \
+{                                                                      \
+       struct cfq_data *cfqd = e->elevator_data;                       \
+       u64 __data = __VAR;                                             \
+       __data = div_u64(__data, NSEC_PER_USEC);                        \
+       return cfq_var_show(__data, (page));                            \
+}
+USEC_SHOW_FUNCTION(cfq_slice_idle_us_show, cfqd->cfq_slice_idle);
+USEC_SHOW_FUNCTION(cfq_group_idle_us_show, cfqd->cfq_group_idle);
+USEC_SHOW_FUNCTION(cfq_slice_sync_us_show, cfqd->cfq_slice[1]);
+USEC_SHOW_FUNCTION(cfq_slice_async_us_show, cfqd->cfq_slice[0]);
+USEC_SHOW_FUNCTION(cfq_target_latency_us_show, cfqd->cfq_target_latency);
+#undef USEC_SHOW_FUNCTION
+
  #define STORE_FUNCTION(__FUNC, __PTR, MIN, MAX, __CONV)                        \
  static ssize_t __FUNC(struct elevator_queue *e, const char *page, size_t count)        \
  {                                                                      \
@@ -4724,6 +4778,26 @@ STORE_FUNCTION(cfq_low_latency_store, &cfqd->cfq_latency, 0, 1, 0);
  STORE_FUNCTION(cfq_target_latency_store, &cfqd->cfq_target_latency, 1, UINT_MAX, 1);
  #undef STORE_FUNCTION
  
+#define USEC_STORE_FUNCTION(__FUNC, __PTR, MIN, MAX)                   \
+static ssize_t __FUNC(struct elevator_queue *e, const char *page, size_t count)        \
+{                                                                      \
+       struct cfq_data *cfqd = e->elevator_data;                       \
+       unsigned int __data;                                            \
+       int ret = cfq_var_store(&__data, (page), count);                \
+       if (__data < (MIN))                                             \
+               __data = (MIN);                                         \
+       else if (__data > (MAX))                                        \
+               __data = (MAX);                                         \
+       *(__PTR) = (u64)__data * NSEC_PER_USEC;                         \
+       return ret;                                                     \
+}
+USEC_STORE_FUNCTION(cfq_slice_idle_us_store, &cfqd->cfq_slice_idle, 0, UINT_MAX);
+USEC_STORE_FUNCTION(cfq_group_idle_us_store, &cfqd->cfq_group_idle, 0, UINT_MAX);
+USEC_STORE_FUNCTION(cfq_slice_sync_us_store, &cfqd->cfq_slice[1], 1, UINT_MAX);
+USEC_STORE_FUNCTION(cfq_slice_async_us_store, &cfqd->cfq_slice[0], 1, UINT_MAX);
+USEC_STORE_FUNCTION(cfq_target_latency_us_store, &cfqd->cfq_target_latency, 1, UINT_MAX);
+#undef USEC_STORE_FUNCTION
+
  #define CFQ_ATTR(name) \
         __ATTR(name, S_IRUGO|S_IWUSR, cfq_##name##_show, cfq_##name##_store)
  
@@ -4734,12 +4808,17 @@ static struct elv_fs_entry cfq_attrs[] = {
         CFQ_ATTR(back_seek_max),
         CFQ_ATTR(back_seek_penalty),
         CFQ_ATTR(slice_sync),
+       CFQ_ATTR(slice_sync_us),
         CFQ_ATTR(slice_async),
+       CFQ_ATTR(slice_async_us),
         CFQ_ATTR(slice_async_rq),
         CFQ_ATTR(slice_idle),
+       CFQ_ATTR(slice_idle_us),
         CFQ_ATTR(group_idle),
+       CFQ_ATTR(group_idle_us),
         CFQ_ATTR(low_latency),
         CFQ_ATTR(target_latency),
+       CFQ_ATTR(target_latency_us),
         __ATTR_NULL
  };
  
@@ -4748,7 +4827,8 @@ static struct elevator_type iosched_cfq = {
                 .elevator_merge_fn =            cfq_merge,
                 .elevator_merged_fn =           cfq_merged_request,
                 .elevator_merge_req_fn =        cfq_merged_requests,
-               .elevator_allow_merge_fn =      cfq_allow_merge,
+               .elevator_allow_bio_merge_fn =  cfq_allow_bio_merge,
+               .elevator_allow_rq_merge_fn =   cfq_allow_rq_merge,
                 .elevator_bio_merged_fn =       cfq_bio_merged,
                 .elevator_dispatch_fn =         cfq_dispatch_requests,
                 .elevator_add_req_fn =          cfq_insert_request,