cachepc-linux

Fork of AMDESE/linux with modifications for CachePC side-channel attack
git clone https://git.sinitax.com/sinitax/cachepc-linux
Log | Files | Refs | README | LICENSE | sfeed.txt

ioprio.rst (4774B)


      1===================
      2Block io priorities
      3===================
      4
      5
      6Intro
      7-----
      8
      9With the introduction of cfq v3 (aka cfq-ts or time sliced cfq), basic io
     10priorities are supported for reads on files.  This enables users to io nice
     11processes or process groups, similar to what has been possible with cpu
     12scheduling for ages.  This document mainly details the current possibilities
     13with cfq; other io schedulers do not support io priorities thus far.
     14
     15Scheduling classes
     16------------------
     17
     18CFQ implements three generic scheduling classes that determine how io is
     19served for a process.
     20
     21IOPRIO_CLASS_RT: This is the realtime io class. This scheduling class is given
     22higher priority than any other in the system, processes from this class are
     23given first access to the disk every time. Thus it needs to be used with some
     24care, one io RT process can starve the entire system. Within the RT class,
     25there are 8 levels of class data that determine exactly how much time this
     26process needs the disk for on each service. In the future this might change
     27to be more directly mappable to performance, by passing in a wanted data
     28rate instead.
     29
     30IOPRIO_CLASS_BE: This is the best-effort scheduling class, which is the default
     31for any process that hasn't set a specific io priority. The class data
     32determines how much io bandwidth the process will get, it's directly mappable
     33to the cpu nice levels just more coarsely implemented. 0 is the highest
     34BE prio level, 7 is the lowest. The mapping between cpu nice level and io
     35nice level is determined as: io_nice = (cpu_nice + 20) / 5.
     36
     37IOPRIO_CLASS_IDLE: This is the idle scheduling class, processes running at this
     38level only get io time when no one else needs the disk. The idle class has no
     39class data, since it doesn't really apply here.
     40
     41Tools
     42-----
     43
     44See below for a sample ionice tool. Usage::
     45
     46	# ionice -c<class> -n<level> -p<pid>
     47
     48If pid isn't given, the current process is assumed. IO priority settings
     49are inherited on fork, so you can use ionice to start the process at a given
     50level::
     51
     52	# ionice -c2 -n0 /bin/ls
     53
     54will run ls at the best-effort scheduling class at the highest priority.
     55For a running process, you can give the pid instead::
     56
     57	# ionice -c1 -n2 -p100
     58
     59will change pid 100 to run at the realtime scheduling class, at priority 2.
     60
     61ionice.c tool::
     62
     63  #include <stdio.h>
     64  #include <stdlib.h>
     65  #include <errno.h>
     66  #include <getopt.h>
     67  #include <unistd.h>
     68  #include <sys/ptrace.h>
     69  #include <asm/unistd.h>
     70
     71  extern int sys_ioprio_set(int, int, int);
     72  extern int sys_ioprio_get(int, int);
     73
     74  #if defined(__i386__)
     75  #define __NR_ioprio_set		289
     76  #define __NR_ioprio_get		290
     77  #elif defined(__ppc__)
     78  #define __NR_ioprio_set		273
     79  #define __NR_ioprio_get		274
     80  #elif defined(__x86_64__)
     81  #define __NR_ioprio_set		251
     82  #define __NR_ioprio_get		252
     83  #elif defined(__ia64__)
     84  #define __NR_ioprio_set		1274
     85  #define __NR_ioprio_get		1275
     86  #else
     87  #error "Unsupported arch"
     88  #endif
     89
     90  static inline int ioprio_set(int which, int who, int ioprio)
     91  {
     92	return syscall(__NR_ioprio_set, which, who, ioprio);
     93  }
     94
     95  static inline int ioprio_get(int which, int who)
     96  {
     97	return syscall(__NR_ioprio_get, which, who);
     98  }
     99
    100  enum {
    101	IOPRIO_CLASS_NONE,
    102	IOPRIO_CLASS_RT,
    103	IOPRIO_CLASS_BE,
    104	IOPRIO_CLASS_IDLE,
    105  };
    106
    107  enum {
    108	IOPRIO_WHO_PROCESS = 1,
    109	IOPRIO_WHO_PGRP,
    110	IOPRIO_WHO_USER,
    111  };
    112
    113  #define IOPRIO_CLASS_SHIFT	13
    114
    115  const char *to_prio[] = { "none", "realtime", "best-effort", "idle", };
    116
    117  int main(int argc, char *argv[])
    118  {
    119	int ioprio = 4, set = 0, ioprio_class = IOPRIO_CLASS_BE;
    120	int c, pid = 0;
    121
    122	while ((c = getopt(argc, argv, "+n:c:p:")) != EOF) {
    123		switch (c) {
    124		case 'n':
    125			ioprio = strtol(optarg, NULL, 10);
    126			set = 1;
    127			break;
    128		case 'c':
    129			ioprio_class = strtol(optarg, NULL, 10);
    130			set = 1;
    131			break;
    132		case 'p':
    133			pid = strtol(optarg, NULL, 10);
    134			break;
    135		}
    136	}
    137
    138	switch (ioprio_class) {
    139		case IOPRIO_CLASS_NONE:
    140			ioprio_class = IOPRIO_CLASS_BE;
    141			break;
    142		case IOPRIO_CLASS_RT:
    143		case IOPRIO_CLASS_BE:
    144			break;
    145		case IOPRIO_CLASS_IDLE:
    146			ioprio = 7;
    147			break;
    148		default:
    149			printf("bad prio class %d\n", ioprio_class);
    150			return 1;
    151	}
    152
    153	if (!set) {
    154		if (!pid && argv[optind])
    155			pid = strtol(argv[optind], NULL, 10);
    156
    157		ioprio = ioprio_get(IOPRIO_WHO_PROCESS, pid);
    158
    159		printf("pid=%d, %d\n", pid, ioprio);
    160
    161		if (ioprio == -1)
    162			perror("ioprio_get");
    163		else {
    164			ioprio_class = ioprio >> IOPRIO_CLASS_SHIFT;
    165			ioprio = ioprio & 0xff;
    166			printf("%s: prio %d\n", to_prio[ioprio_class], ioprio);
    167		}
    168	} else {
    169		if (ioprio_set(IOPRIO_WHO_PROCESS, pid, ioprio | ioprio_class << IOPRIO_CLASS_SHIFT) == -1) {
    170			perror("ioprio_set");
    171			return 1;
    172		}
    173
    174		if (argv[optind])
    175			execvp(argv[optind], &argv[optind]);
    176	}
    177
    178	return 0;
    179  }
    180
    181
    182March 11 2005, Jens Axboe <jens.axboe@oracle.com>