1 /* $NetBSD: rf_cvscan.c,v 1.14 2006/10/12 01:31:50 christos Exp $ */
3 * Copyright (c) 1995 Carnegie-Mellon University.
8 * Permission to use, copy, modify and distribute this software and
9 * its documentation is hereby granted, provided that both the copyright
10 * notice and this permission notice appear in all copies of the
11 * software, derivative works or modified versions, and any portions
12 * thereof, and that both notices appear in supporting documentation.
14 * CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS "AS IS"
15 * CONDITION. CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND
16 * FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE.
18 * Carnegie Mellon requests users of this software to return to
20 * Software Distribution Coordinator or Software.Distribution@CS.CMU.EDU
21 * School of Computer Science
22 * Carnegie Mellon University
23 * Pittsburgh PA 15213-3890
25 * any improvements or extensions that they make and grant Carnegie the
26 * rights to redistribute these changes.
29 /*******************************************************************************
31 * cvscan.c -- prioritized cvscan disk queueing code.
33 * Nov 9, 1994, adapted from raidSim version (MCH)
35 ******************************************************************************/
37 #include <sys/cdefs.h>
38 __KERNEL_RCSID(0, "$NetBSD: rf_cvscan.c,v 1.14 2006/10/12 01:31:50 christos Exp $");
40 #include <dev/raidframe/raidframevar.h>
41 #include "rf_alloclist.h"
42 #include "rf_stripelocks.h"
43 #include "rf_layout.h"
44 #include "rf_diskqueue.h"
45 #include "rf_cvscan.h"
46 #include "rf_debugMem.h"
47 #include "rf_general.h"
49 #define DO_CHECK_STATE(_hdr_) CheckCvscanState((_hdr_))
51 #define pri_ok(p) ( ((p) == RF_IO_NORMAL_PRIORITY) || ((p) == RF_IO_LOW_PRIORITY))
54 CheckCvscanState(RF_CvscanHeader_t
*hdr
)
57 RF_DiskQueueData_t
*tmp
;
59 if (hdr
->left
!= (RF_DiskQueueData_t
*) NULL
)
60 RF_ASSERT(hdr
->left
->sectorOffset
< hdr
->cur_block
);
61 for (key
= hdr
->cur_block
, i
= 0, tmp
= hdr
->left
;
62 tmp
!= (RF_DiskQueueData_t
*) NULL
;
63 key
= tmp
->sectorOffset
, i
++, tmp
= tmp
->next
)
64 RF_ASSERT(tmp
->sectorOffset
<= key
65 && tmp
->priority
== hdr
->nxt_priority
&& pri_ok(tmp
->priority
));
66 RF_ASSERT(i
== hdr
->left_cnt
);
68 for (key
= hdr
->cur_block
, i
= 0, tmp
= hdr
->right
;
69 tmp
!= (RF_DiskQueueData_t
*) NULL
;
70 key
= tmp
->sectorOffset
, i
++, tmp
= tmp
->next
) {
71 RF_ASSERT(key
<= tmp
->sectorOffset
);
72 RF_ASSERT(tmp
->priority
== hdr
->nxt_priority
);
73 RF_ASSERT(pri_ok(tmp
->priority
));
75 RF_ASSERT(i
== hdr
->right_cnt
);
77 for (key
= hdr
->nxt_priority
- 1, tmp
= hdr
->burner
;
78 tmp
!= (RF_DiskQueueData_t
*) NULL
;
79 key
= tmp
->priority
, tmp
= tmp
->next
) {
82 RF_ASSERT(pri_ok(tmp
->priority
));
83 RF_ASSERT(key
>= tmp
->priority
);
84 RF_ASSERT(tmp
->priority
< hdr
->nxt_priority
);
91 PriorityInsert(RF_DiskQueueData_t
**list_ptr
, RF_DiskQueueData_t
*req
)
93 /* * insert block pointed to by req in to list whose first * entry is
94 * pointed to by the pointer that list_ptr points to * ie., list_ptr
95 * is a grandparent of the first entry */
97 for (; (*list_ptr
) != (RF_DiskQueueData_t
*) NULL
&&
98 (*list_ptr
)->priority
> req
->priority
;
99 list_ptr
= &((*list_ptr
)->next
)) {
101 req
->next
= (*list_ptr
);
108 ReqInsert(RF_DiskQueueData_t
**list_ptr
, RF_DiskQueueData_t
*req
, RF_CvscanArmDir_t order
)
110 /* * insert block pointed to by req in to list whose first * entry is
111 * pointed to by the pointer that list_ptr points to * ie., list_ptr
112 * is a grandparent of the first entry */
114 for (; (*list_ptr
) != (RF_DiskQueueData_t
*) NULL
&&
116 ((order
== rf_cvscan_RIGHT
&& (*list_ptr
)->sectorOffset
<= req
->sectorOffset
)
117 || (order
== rf_cvscan_LEFT
&& (*list_ptr
)->sectorOffset
> req
->sectorOffset
));
118 list_ptr
= &((*list_ptr
)->next
)) {
120 req
->next
= (*list_ptr
);
126 static RF_DiskQueueData_t
*
127 ReqDequeue(RF_DiskQueueData_t
**list_ptr
)
129 RF_DiskQueueData_t
*ret
= (*list_ptr
);
130 if ((*list_ptr
) != (RF_DiskQueueData_t
*) NULL
) {
131 (*list_ptr
) = (*list_ptr
)->next
;
139 ReBalance(RF_CvscanHeader_t
*hdr
)
141 /* DO_CHECK_STATE(hdr); */
142 while (hdr
->right
!= (RF_DiskQueueData_t
*) NULL
143 && hdr
->right
->sectorOffset
< hdr
->cur_block
) {
146 ReqInsert(&hdr
->left
, ReqDequeue(&hdr
->right
), rf_cvscan_LEFT
);
148 /* DO_CHECK_STATE(hdr); */
154 Transfer(RF_DiskQueueData_t
**to_list_ptr
, RF_DiskQueueData_t
**from_list_ptr
)
156 RF_DiskQueueData_t
*gp
;
157 for (gp
= (*from_list_ptr
); gp
!= (RF_DiskQueueData_t
*) NULL
;) {
158 RF_DiskQueueData_t
*p
= gp
->next
;
159 PriorityInsert(to_list_ptr
, gp
);
162 (*from_list_ptr
) = (RF_DiskQueueData_t
*) NULL
;
168 RealEnqueue(RF_CvscanHeader_t
*hdr
, RF_DiskQueueData_t
*req
)
170 RF_ASSERT(req
->priority
== RF_IO_NORMAL_PRIORITY
|| req
->priority
== RF_IO_LOW_PRIORITY
);
173 if (hdr
->left_cnt
== 0 && hdr
->right_cnt
== 0) {
174 hdr
->nxt_priority
= req
->priority
;
176 if (req
->priority
> hdr
->nxt_priority
) {
178 ** dump all other outstanding requests on the back burner
180 Transfer(&hdr
->burner
, &hdr
->left
);
181 Transfer(&hdr
->burner
, &hdr
->right
);
184 hdr
->nxt_priority
= req
->priority
;
186 if (req
->priority
< hdr
->nxt_priority
) {
188 ** yet another low priority task!
190 PriorityInsert(&hdr
->burner
, req
);
192 if (req
->sectorOffset
< hdr
->cur_block
) {
193 /* this request is to the left of the current arms */
194 ReqInsert(&hdr
->left
, req
, rf_cvscan_LEFT
);
197 /* this request is to the right of the current arms */
198 ReqInsert(&hdr
->right
, req
, rf_cvscan_RIGHT
);
208 rf_CvscanEnqueue(void *q_in
, RF_DiskQueueData_t
* elem
, int priority
)
210 RF_CvscanHeader_t
*hdr
= (RF_CvscanHeader_t
*) q_in
;
211 RealEnqueue(hdr
, elem
/* req */ );
217 rf_CvscanDequeue(void *q_in
)
219 RF_CvscanHeader_t
*hdr
= (RF_CvscanHeader_t
*) q_in
;
220 long range
, i
, sum_dist_left
, sum_dist_right
;
221 RF_DiskQueueData_t
*ret
;
222 RF_DiskQueueData_t
*tmp
;
226 if (hdr
->left_cnt
== 0 && hdr
->right_cnt
== 0)
227 return ((RF_DiskQueueData_t
*) NULL
);
229 range
= RF_MIN(hdr
->range_for_avg
, RF_MIN(hdr
->left_cnt
, hdr
->right_cnt
));
230 for (i
= 0, tmp
= hdr
->left
, sum_dist_left
=
231 ((hdr
->direction
== rf_cvscan_RIGHT
) ? range
* hdr
->change_penalty
: 0);
232 tmp
!= (RF_DiskQueueData_t
*) NULL
&& i
< range
;
233 tmp
= tmp
->next
, i
++) {
234 sum_dist_left
+= hdr
->cur_block
- tmp
->sectorOffset
;
236 for (i
= 0, tmp
= hdr
->right
, sum_dist_right
=
237 ((hdr
->direction
== rf_cvscan_LEFT
) ? range
* hdr
->change_penalty
: 0);
238 tmp
!= (RF_DiskQueueData_t
*) NULL
&& i
< range
;
239 tmp
= tmp
->next
, i
++) {
240 sum_dist_right
+= tmp
->sectorOffset
- hdr
->cur_block
;
243 if (hdr
->right_cnt
== 0 || sum_dist_left
< sum_dist_right
) {
244 hdr
->direction
= rf_cvscan_LEFT
;
245 hdr
->cur_block
= hdr
->left
->sectorOffset
+ hdr
->left
->numSector
;
246 hdr
->left_cnt
= RF_MAX(hdr
->left_cnt
- 1, 0);
248 ret
= (ReqDequeue(&hdr
->left
)) /*->parent*/ ;
250 hdr
->direction
= rf_cvscan_RIGHT
;
251 hdr
->cur_block
= hdr
->right
->sectorOffset
+ hdr
->right
->numSector
;
252 hdr
->right_cnt
= RF_MAX(hdr
->right_cnt
- 1, 0);
254 ret
= (ReqDequeue(&hdr
->right
)) /*->parent*/ ;
258 if (hdr
->left_cnt
== 0 && hdr
->right_cnt
== 0
259 && hdr
->burner
!= (RF_DiskQueueData_t
*) NULL
) {
261 ** restore low priority requests for next dequeue
263 RF_DiskQueueData_t
*burner
= hdr
->burner
;
264 hdr
->nxt_priority
= burner
->priority
;
265 while (burner
!= (RF_DiskQueueData_t
*) NULL
266 && burner
->priority
== hdr
->nxt_priority
) {
267 RF_DiskQueueData_t
*next
= burner
->next
;
268 RealEnqueue(hdr
, burner
);
271 hdr
->burner
= burner
;
280 rf_CvscanPeek(void *q_in
)
282 RF_CvscanHeader_t
*hdr
= (RF_CvscanHeader_t
*) q_in
;
283 long range
, i
, sum_dist_left
, sum_dist_right
;
284 RF_DiskQueueData_t
*tmp
, *headElement
;
288 if (hdr
->left_cnt
== 0 && hdr
->right_cnt
== 0)
291 range
= RF_MIN(hdr
->range_for_avg
, RF_MIN(hdr
->left_cnt
, hdr
->right_cnt
));
292 for (i
= 0, tmp
= hdr
->left
, sum_dist_left
=
293 ((hdr
->direction
== rf_cvscan_RIGHT
) ? range
* hdr
->change_penalty
: 0);
294 tmp
!= (RF_DiskQueueData_t
*) NULL
&& i
< range
;
295 tmp
= tmp
->next
, i
++) {
296 sum_dist_left
+= hdr
->cur_block
- tmp
->sectorOffset
;
298 for (i
= 0, tmp
= hdr
->right
, sum_dist_right
=
299 ((hdr
->direction
== rf_cvscan_LEFT
) ? range
* hdr
->change_penalty
: 0);
300 tmp
!= (RF_DiskQueueData_t
*) NULL
&& i
< range
;
301 tmp
= tmp
->next
, i
++) {
302 sum_dist_right
+= tmp
->sectorOffset
- hdr
->cur_block
;
305 if (hdr
->right_cnt
== 0 || sum_dist_left
< sum_dist_right
)
306 headElement
= hdr
->left
;
308 headElement
= hdr
->right
;
310 return (headElement
);
316 ** CVSCAN( 1, 0 ) is Shortest Seek Time First (SSTF)
317 ** lowest average response time
318 ** CVSCAN( 1, infinity ) is SCAN
319 ** lowest response time standard deviation
323 rf_CvscanCreate(RF_SectorCount_t sectPerDisk
,
324 RF_AllocListElem_t
*clList
,
325 RF_ShutdownList_t
**listp
)
327 RF_CvscanHeader_t
*hdr
;
328 long range
= 2; /* Currently no mechanism to change these */
329 long penalty
= sectPerDisk
/ 5;
331 RF_MallocAndAdd(hdr
, sizeof(RF_CvscanHeader_t
), (RF_CvscanHeader_t
*), clList
);
332 memset((char *) hdr
, 0, sizeof(RF_CvscanHeader_t
));
333 hdr
->range_for_avg
= RF_MAX(range
, 1);
334 hdr
->change_penalty
= RF_MAX(penalty
, 0);
335 hdr
->direction
= rf_cvscan_RIGHT
;
337 hdr
->left_cnt
= hdr
->right_cnt
= 0;
338 hdr
->left
= hdr
->right
= (RF_DiskQueueData_t
*) NULL
;
339 hdr
->burner
= (RF_DiskQueueData_t
*) NULL
;
342 return ((void *) hdr
);
346 #if defined(__NetBSD__) && defined(_KERNEL)
347 /* PrintCvscanQueue is not used, so we ignore it... */
350 PrintCvscanQueue(RF_CvscanHeader_t
*hdr
)
352 RF_DiskQueueData_t
*tmp
;
354 printf("CVSCAN(%d,%d) at %d going %s\n",
355 (int) hdr
->range_for_avg
,
356 (int) hdr
->change_penalty
,
357 (int) hdr
->cur_block
,
358 (hdr
->direction
== rf_cvscan_LEFT
) ? "LEFT" : "RIGHT");
359 printf("\tLeft(%d): ", hdr
->left_cnt
);
360 for (tmp
= hdr
->left
; tmp
!= (RF_DiskQueueData_t
*) NULL
; tmp
= tmp
->next
)
361 printf("(%d,%ld,%d) ",
362 (int) tmp
->sectorOffset
,
363 (long) (tmp
->sectorOffset
+ tmp
->numSector
),
366 printf("\tRight(%d): ", hdr
->right_cnt
);
367 for (tmp
= hdr
->right
; tmp
!= (RF_DiskQueueData_t
*) NULL
; tmp
= tmp
->next
)
368 printf("(%d,%ld,%d) ",
369 (int) tmp
->sectorOffset
,
370 (long) (tmp
->sectorOffset
+ tmp
->numSector
),
373 printf("\tBurner: ");
374 for (tmp
= hdr
->burner
; tmp
!= (RF_DiskQueueData_t
*) NULL
; tmp
= tmp
->next
)
375 printf("(%d,%ld,%d) ",
376 (int) tmp
->sectorOffset
,
377 (long) (tmp
->sectorOffset
+ tmp
->numSector
),
384 /* promotes reconstruction accesses for the given stripeID to normal priority.
385 * returns 1 if an access was found and zero otherwise. Normally, we should
386 * only have one or zero entries in the burner queue, so execution time should
390 rf_CvscanPromote(void *q_in
, RF_StripeNum_t parityStripeID
,
391 RF_ReconUnitNum_t which_ru
)
393 RF_CvscanHeader_t
*hdr
= (RF_CvscanHeader_t
*) q_in
;
394 RF_DiskQueueData_t
*trailer
= NULL
, *tmp
= hdr
->burner
, *tlist
= NULL
;
398 while (tmp
) { /* handle entries at the front of the list */
399 if (tmp
->parityStripeID
== parityStripeID
&& tmp
->which_ru
== which_ru
) {
400 hdr
->burner
= tmp
->next
;
401 tmp
->priority
= RF_IO_NORMAL_PRIORITY
;
412 while (tmp
) { /* handle entries on the rest of the list */
413 if (tmp
->parityStripeID
== parityStripeID
&& tmp
->which_ru
== which_ru
) {
414 trailer
->next
= tmp
->next
;
415 tmp
->priority
= RF_IO_NORMAL_PRIORITY
;
417 tlist
= tmp
; /* insert on a temp queue */
427 RealEnqueue(hdr
, tlist
);
430 RF_ASSERT(retval
== 0 || retval
== 1);
431 DO_CHECK_STATE((RF_CvscanHeader_t
*) q_in
);