xref: /kernel/linux/linux-5.10/drivers/s390/cio/cmf.c (revision 8c2ecf20)
1// SPDX-License-Identifier: GPL-2.0+
2/*
3 * Linux on zSeries Channel Measurement Facility support
4 *
5 * Copyright IBM Corp. 2000, 2006
6 *
7 * Authors: Arnd Bergmann <arndb@de.ibm.com>
8 *	    Cornelia Huck <cornelia.huck@de.ibm.com>
9 *
10 * original idea from Natarajan Krishnaswami <nkrishna@us.ibm.com>
11 */
12
13#define KMSG_COMPONENT "cio"
14#define pr_fmt(fmt) KMSG_COMPONENT ": " fmt
15
16#include <linux/memblock.h>
17#include <linux/device.h>
18#include <linux/init.h>
19#include <linux/list.h>
20#include <linux/export.h>
21#include <linux/moduleparam.h>
22#include <linux/slab.h>
23#include <linux/timex.h>	/* get_tod_clock() */
24
25#include <asm/ccwdev.h>
26#include <asm/cio.h>
27#include <asm/cmb.h>
28#include <asm/div64.h>
29
30#include "cio.h"
31#include "css.h"
32#include "device.h"
33#include "ioasm.h"
34#include "chsc.h"
35
36/*
37 * parameter to enable cmf during boot, possible uses are:
38 *  "s390cmf" -- enable cmf and allocate 2 MB of ram so measuring can be
39 *               used on any subchannel
40 *  "s390cmf=<num>" -- enable cmf and allocate enough memory to measure
41 *                     <num> subchannel, where <num> is an integer
42 *                     between 1 and 65535, default is 1024
43 */
44#define ARGSTRING "s390cmf"
45
46/* indices for READCMB */
47enum cmb_index {
48	avg_utilization = -1,
49 /* basic and exended format: */
50	cmb_ssch_rsch_count = 0,
51	cmb_sample_count,
52	cmb_device_connect_time,
53	cmb_function_pending_time,
54	cmb_device_disconnect_time,
55	cmb_control_unit_queuing_time,
56	cmb_device_active_only_time,
57 /* extended format only: */
58	cmb_device_busy_time,
59	cmb_initial_command_response_time,
60};
61
62/**
63 * enum cmb_format - types of supported measurement block formats
64 *
65 * @CMF_BASIC:      traditional channel measurement blocks supported
66 *		    by all machines that we run on
67 * @CMF_EXTENDED:   improved format that was introduced with the z990
68 *		    machine
69 * @CMF_AUTODETECT: default: use extended format when running on a machine
70 *		    supporting extended format, otherwise fall back to
71 *		    basic format
72 */
73enum cmb_format {
74	CMF_BASIC,
75	CMF_EXTENDED,
76	CMF_AUTODETECT = -1,
77};
78
79/*
80 * format - actual format for all measurement blocks
81 *
82 * The format module parameter can be set to a value of 0 (zero)
83 * or 1, indicating basic or extended format as described for
84 * enum cmb_format.
85 */
86static int format = CMF_AUTODETECT;
87module_param(format, bint, 0444);
88
89/**
90 * struct cmb_operations - functions to use depending on cmb_format
91 *
92 * Most of these functions operate on a struct ccw_device. There is only
93 * one instance of struct cmb_operations because the format of the measurement
94 * data is guaranteed to be the same for every ccw_device.
95 *
96 * @alloc:	allocate memory for a channel measurement block,
97 *		either with the help of a special pool or with kmalloc
98 * @free:	free memory allocated with @alloc
99 * @set:	enable or disable measurement
100 * @read:	read a measurement entry at an index
101 * @readall:	read a measurement block in a common format
102 * @reset:	clear the data in the associated measurement block and
103 *		reset its time stamp
104 */
105struct cmb_operations {
106	int  (*alloc)  (struct ccw_device *);
107	void (*free)   (struct ccw_device *);
108	int  (*set)    (struct ccw_device *, u32);
109	u64  (*read)   (struct ccw_device *, int);
110	int  (*readall)(struct ccw_device *, struct cmbdata *);
111	void (*reset)  (struct ccw_device *);
112/* private: */
113	struct attribute_group *attr_group;
114};
115static struct cmb_operations *cmbops;
116
117struct cmb_data {
118	void *hw_block;   /* Pointer to block updated by hardware */
119	void *last_block; /* Last changed block copied from hardware block */
120	int size;	  /* Size of hw_block and last_block */
121	unsigned long long last_update;  /* when last_block was updated */
122};
123
124/*
125 * Our user interface is designed in terms of nanoseconds,
126 * while the hardware measures total times in its own
127 * unit.
128 */
129static inline u64 time_to_nsec(u32 value)
130{
131	return ((u64)value) * 128000ull;
132}
133
134/*
135 * Users are usually interested in average times,
136 * not accumulated time.
137 * This also helps us with atomicity problems
138 * when reading sinlge values.
139 */
140static inline u64 time_to_avg_nsec(u32 value, u32 count)
141{
142	u64 ret;
143
144	/* no samples yet, avoid division by 0 */
145	if (count == 0)
146		return 0;
147
148	/* value comes in units of 128 µsec */
149	ret = time_to_nsec(value);
150	do_div(ret, count);
151
152	return ret;
153}
154
155#define CMF_OFF 0
156#define CMF_ON	2
157
158/*
159 * Activate or deactivate the channel monitor. When area is NULL,
160 * the monitor is deactivated. The channel monitor needs to
161 * be active in order to measure subchannels, which also need
162 * to be enabled.
163 */
164static inline void cmf_activate(void *area, unsigned int onoff)
165{
166	register void * __gpr2 asm("2");
167	register long __gpr1 asm("1");
168
169	__gpr2 = area;
170	__gpr1 = onoff;
171	/* activate channel measurement */
172	asm("schm" : : "d" (__gpr2), "d" (__gpr1) );
173}
174
175static int set_schib(struct ccw_device *cdev, u32 mme, int mbfc,
176		     unsigned long address)
177{
178	struct subchannel *sch = to_subchannel(cdev->dev.parent);
179	int ret;
180
181	sch->config.mme = mme;
182	sch->config.mbfc = mbfc;
183	/* address can be either a block address or a block index */
184	if (mbfc)
185		sch->config.mba = address;
186	else
187		sch->config.mbi = address;
188
189	ret = cio_commit_config(sch);
190	if (!mme && ret == -ENODEV) {
191		/*
192		 * The task was to disable measurement block updates but
193		 * the subchannel is already gone. Report success.
194		 */
195		ret = 0;
196	}
197	return ret;
198}
199
200struct set_schib_struct {
201	u32 mme;
202	int mbfc;
203	unsigned long address;
204	wait_queue_head_t wait;
205	int ret;
206};
207
208#define CMF_PENDING 1
209#define SET_SCHIB_TIMEOUT (10 * HZ)
210
211static int set_schib_wait(struct ccw_device *cdev, u32 mme,
212			  int mbfc, unsigned long address)
213{
214	struct set_schib_struct set_data;
215	int ret = -ENODEV;
216
217	spin_lock_irq(cdev->ccwlock);
218	if (!cdev->private->cmb)
219		goto out;
220
221	ret = set_schib(cdev, mme, mbfc, address);
222	if (ret != -EBUSY)
223		goto out;
224
225	/* if the device is not online, don't even try again */
226	if (cdev->private->state != DEV_STATE_ONLINE)
227		goto out;
228
229	init_waitqueue_head(&set_data.wait);
230	set_data.mme = mme;
231	set_data.mbfc = mbfc;
232	set_data.address = address;
233	set_data.ret = CMF_PENDING;
234
235	cdev->private->state = DEV_STATE_CMFCHANGE;
236	cdev->private->cmb_wait = &set_data;
237	spin_unlock_irq(cdev->ccwlock);
238
239	ret = wait_event_interruptible_timeout(set_data.wait,
240					       set_data.ret != CMF_PENDING,
241					       SET_SCHIB_TIMEOUT);
242	spin_lock_irq(cdev->ccwlock);
243	if (ret <= 0) {
244		if (set_data.ret == CMF_PENDING) {
245			set_data.ret = (ret == 0) ? -ETIME : ret;
246			if (cdev->private->state == DEV_STATE_CMFCHANGE)
247				cdev->private->state = DEV_STATE_ONLINE;
248		}
249	}
250	cdev->private->cmb_wait = NULL;
251	ret = set_data.ret;
252out:
253	spin_unlock_irq(cdev->ccwlock);
254	return ret;
255}
256
257void retry_set_schib(struct ccw_device *cdev)
258{
259	struct set_schib_struct *set_data = cdev->private->cmb_wait;
260
261	if (!set_data)
262		return;
263
264	set_data->ret = set_schib(cdev, set_data->mme, set_data->mbfc,
265				  set_data->address);
266	wake_up(&set_data->wait);
267}
268
269static int cmf_copy_block(struct ccw_device *cdev)
270{
271	struct subchannel *sch = to_subchannel(cdev->dev.parent);
272	struct cmb_data *cmb_data;
273	void *hw_block;
274
275	if (cio_update_schib(sch))
276		return -ENODEV;
277
278	if (scsw_fctl(&sch->schib.scsw) & SCSW_FCTL_START_FUNC) {
279		/* Don't copy if a start function is in progress. */
280		if ((!(scsw_actl(&sch->schib.scsw) & SCSW_ACTL_SUSPENDED)) &&
281		    (scsw_actl(&sch->schib.scsw) &
282		     (SCSW_ACTL_DEVACT | SCSW_ACTL_SCHACT)) &&
283		    (!(scsw_stctl(&sch->schib.scsw) & SCSW_STCTL_SEC_STATUS)))
284			return -EBUSY;
285	}
286	cmb_data = cdev->private->cmb;
287	hw_block = cmb_data->hw_block;
288	memcpy(cmb_data->last_block, hw_block, cmb_data->size);
289	cmb_data->last_update = get_tod_clock();
290	return 0;
291}
292
293struct copy_block_struct {
294	wait_queue_head_t wait;
295	int ret;
296};
297
298static int cmf_cmb_copy_wait(struct ccw_device *cdev)
299{
300	struct copy_block_struct copy_block;
301	int ret = -ENODEV;
302
303	spin_lock_irq(cdev->ccwlock);
304	if (!cdev->private->cmb)
305		goto out;
306
307	ret = cmf_copy_block(cdev);
308	if (ret != -EBUSY)
309		goto out;
310
311	if (cdev->private->state != DEV_STATE_ONLINE)
312		goto out;
313
314	init_waitqueue_head(&copy_block.wait);
315	copy_block.ret = CMF_PENDING;
316
317	cdev->private->state = DEV_STATE_CMFUPDATE;
318	cdev->private->cmb_wait = &copy_block;
319	spin_unlock_irq(cdev->ccwlock);
320
321	ret = wait_event_interruptible(copy_block.wait,
322				       copy_block.ret != CMF_PENDING);
323	spin_lock_irq(cdev->ccwlock);
324	if (ret) {
325		if (copy_block.ret == CMF_PENDING) {
326			copy_block.ret = -ERESTARTSYS;
327			if (cdev->private->state == DEV_STATE_CMFUPDATE)
328				cdev->private->state = DEV_STATE_ONLINE;
329		}
330	}
331	cdev->private->cmb_wait = NULL;
332	ret = copy_block.ret;
333out:
334	spin_unlock_irq(cdev->ccwlock);
335	return ret;
336}
337
338void cmf_retry_copy_block(struct ccw_device *cdev)
339{
340	struct copy_block_struct *copy_block = cdev->private->cmb_wait;
341
342	if (!copy_block)
343		return;
344
345	copy_block->ret = cmf_copy_block(cdev);
346	wake_up(&copy_block->wait);
347}
348
349static void cmf_generic_reset(struct ccw_device *cdev)
350{
351	struct cmb_data *cmb_data;
352
353	spin_lock_irq(cdev->ccwlock);
354	cmb_data = cdev->private->cmb;
355	if (cmb_data) {
356		memset(cmb_data->last_block, 0, cmb_data->size);
357		/*
358		 * Need to reset hw block as well to make the hardware start
359		 * from 0 again.
360		 */
361		memset(cmb_data->hw_block, 0, cmb_data->size);
362		cmb_data->last_update = 0;
363	}
364	cdev->private->cmb_start_time = get_tod_clock();
365	spin_unlock_irq(cdev->ccwlock);
366}
367
368/**
369 * struct cmb_area - container for global cmb data
370 *
371 * @mem:	pointer to CMBs (only in basic measurement mode)
372 * @list:	contains a linked list of all subchannels
373 * @num_channels: number of channels to be measured
374 * @lock:	protect concurrent access to @mem and @list
375 */
376struct cmb_area {
377	struct cmb *mem;
378	struct list_head list;
379	int num_channels;
380	spinlock_t lock;
381};
382
383static struct cmb_area cmb_area = {
384	.lock = __SPIN_LOCK_UNLOCKED(cmb_area.lock),
385	.list = LIST_HEAD_INIT(cmb_area.list),
386	.num_channels  = 1024,
387};
388
389/* ****** old style CMB handling ********/
390
391/*
392 * Basic channel measurement blocks are allocated in one contiguous
393 * block of memory, which can not be moved as long as any channel
394 * is active. Therefore, a maximum number of subchannels needs to
395 * be defined somewhere. This is a module parameter, defaulting to
396 * a reasonable value of 1024, or 32 kb of memory.
397 * Current kernels don't allow kmalloc with more than 128kb, so the
398 * maximum is 4096.
399 */
400
401module_param_named(maxchannels, cmb_area.num_channels, uint, 0444);
402
403/**
404 * struct cmb - basic channel measurement block
405 * @ssch_rsch_count: number of ssch and rsch
406 * @sample_count: number of samples
407 * @device_connect_time: time of device connect
408 * @function_pending_time: time of function pending
409 * @device_disconnect_time: time of device disconnect
410 * @control_unit_queuing_time: time of control unit queuing
411 * @device_active_only_time: time of device active only
412 * @reserved: unused in basic measurement mode
413 *
414 * The measurement block as used by the hardware. The fields are described
415 * further in z/Architecture Principles of Operation, chapter 17.
416 *
417 * The cmb area made up from these blocks must be a contiguous array and may
418 * not be reallocated or freed.
419 * Only one cmb area can be present in the system.
420 */
421struct cmb {
422	u16 ssch_rsch_count;
423	u16 sample_count;
424	u32 device_connect_time;
425	u32 function_pending_time;
426	u32 device_disconnect_time;
427	u32 control_unit_queuing_time;
428	u32 device_active_only_time;
429	u32 reserved[2];
430};
431
432/*
433 * Insert a single device into the cmb_area list.
434 * Called with cmb_area.lock held from alloc_cmb.
435 */
436static int alloc_cmb_single(struct ccw_device *cdev,
437			    struct cmb_data *cmb_data)
438{
439	struct cmb *cmb;
440	struct ccw_device_private *node;
441	int ret;
442
443	spin_lock_irq(cdev->ccwlock);
444	if (!list_empty(&cdev->private->cmb_list)) {
445		ret = -EBUSY;
446		goto out;
447	}
448
449	/*
450	 * Find first unused cmb in cmb_area.mem.
451	 * This is a little tricky: cmb_area.list
452	 * remains sorted by ->cmb->hw_data pointers.
453	 */
454	cmb = cmb_area.mem;
455	list_for_each_entry(node, &cmb_area.list, cmb_list) {
456		struct cmb_data *data;
457		data = node->cmb;
458		if ((struct cmb*)data->hw_block > cmb)
459			break;
460		cmb++;
461	}
462	if (cmb - cmb_area.mem >= cmb_area.num_channels) {
463		ret = -ENOMEM;
464		goto out;
465	}
466
467	/* insert new cmb */
468	list_add_tail(&cdev->private->cmb_list, &node->cmb_list);
469	cmb_data->hw_block = cmb;
470	cdev->private->cmb = cmb_data;
471	ret = 0;
472out:
473	spin_unlock_irq(cdev->ccwlock);
474	return ret;
475}
476
477static int alloc_cmb(struct ccw_device *cdev)
478{
479	int ret;
480	struct cmb *mem;
481	ssize_t size;
482	struct cmb_data *cmb_data;
483
484	/* Allocate private cmb_data. */
485	cmb_data = kzalloc(sizeof(struct cmb_data), GFP_KERNEL);
486	if (!cmb_data)
487		return -ENOMEM;
488
489	cmb_data->last_block = kzalloc(sizeof(struct cmb), GFP_KERNEL);
490	if (!cmb_data->last_block) {
491		kfree(cmb_data);
492		return -ENOMEM;
493	}
494	cmb_data->size = sizeof(struct cmb);
495	spin_lock(&cmb_area.lock);
496
497	if (!cmb_area.mem) {
498		/* there is no user yet, so we need a new area */
499		size = sizeof(struct cmb) * cmb_area.num_channels;
500		WARN_ON(!list_empty(&cmb_area.list));
501
502		spin_unlock(&cmb_area.lock);
503		mem = (void*)__get_free_pages(GFP_KERNEL | GFP_DMA,
504				 get_order(size));
505		spin_lock(&cmb_area.lock);
506
507		if (cmb_area.mem) {
508			/* ok, another thread was faster */
509			free_pages((unsigned long)mem, get_order(size));
510		} else if (!mem) {
511			/* no luck */
512			ret = -ENOMEM;
513			goto out;
514		} else {
515			/* everything ok */
516			memset(mem, 0, size);
517			cmb_area.mem = mem;
518			cmf_activate(cmb_area.mem, CMF_ON);
519		}
520	}
521
522	/* do the actual allocation */
523	ret = alloc_cmb_single(cdev, cmb_data);
524out:
525	spin_unlock(&cmb_area.lock);
526	if (ret) {
527		kfree(cmb_data->last_block);
528		kfree(cmb_data);
529	}
530	return ret;
531}
532
533static void free_cmb(struct ccw_device *cdev)
534{
535	struct ccw_device_private *priv;
536	struct cmb_data *cmb_data;
537
538	spin_lock(&cmb_area.lock);
539	spin_lock_irq(cdev->ccwlock);
540
541	priv = cdev->private;
542	cmb_data = priv->cmb;
543	priv->cmb = NULL;
544	if (cmb_data)
545		kfree(cmb_data->last_block);
546	kfree(cmb_data);
547	list_del_init(&priv->cmb_list);
548
549	if (list_empty(&cmb_area.list)) {
550		ssize_t size;
551		size = sizeof(struct cmb) * cmb_area.num_channels;
552		cmf_activate(NULL, CMF_OFF);
553		free_pages((unsigned long)cmb_area.mem, get_order(size));
554		cmb_area.mem = NULL;
555	}
556	spin_unlock_irq(cdev->ccwlock);
557	spin_unlock(&cmb_area.lock);
558}
559
560static int set_cmb(struct ccw_device *cdev, u32 mme)
561{
562	u16 offset;
563	struct cmb_data *cmb_data;
564	unsigned long flags;
565
566	spin_lock_irqsave(cdev->ccwlock, flags);
567	if (!cdev->private->cmb) {
568		spin_unlock_irqrestore(cdev->ccwlock, flags);
569		return -EINVAL;
570	}
571	cmb_data = cdev->private->cmb;
572	offset = mme ? (struct cmb *)cmb_data->hw_block - cmb_area.mem : 0;
573	spin_unlock_irqrestore(cdev->ccwlock, flags);
574
575	return set_schib_wait(cdev, mme, 0, offset);
576}
577
578/* calculate utilization in 0.1 percent units */
579static u64 __cmb_utilization(u64 device_connect_time, u64 function_pending_time,
580			     u64 device_disconnect_time, u64 start_time)
581{
582	u64 utilization, elapsed_time;
583
584	utilization = time_to_nsec(device_connect_time +
585				   function_pending_time +
586				   device_disconnect_time);
587
588	elapsed_time = get_tod_clock() - start_time;
589	elapsed_time = tod_to_ns(elapsed_time);
590	elapsed_time /= 1000;
591
592	return elapsed_time ? (utilization / elapsed_time) : 0;
593}
594
595static u64 read_cmb(struct ccw_device *cdev, int index)
596{
597	struct cmb_data *cmb_data;
598	unsigned long flags;
599	struct cmb *cmb;
600	u64 ret = 0;
601	u32 val;
602
603	spin_lock_irqsave(cdev->ccwlock, flags);
604	cmb_data = cdev->private->cmb;
605	if (!cmb_data)
606		goto out;
607
608	cmb = cmb_data->hw_block;
609	switch (index) {
610	case avg_utilization:
611		ret = __cmb_utilization(cmb->device_connect_time,
612					cmb->function_pending_time,
613					cmb->device_disconnect_time,
614					cdev->private->cmb_start_time);
615		goto out;
616	case cmb_ssch_rsch_count:
617		ret = cmb->ssch_rsch_count;
618		goto out;
619	case cmb_sample_count:
620		ret = cmb->sample_count;
621		goto out;
622	case cmb_device_connect_time:
623		val = cmb->device_connect_time;
624		break;
625	case cmb_function_pending_time:
626		val = cmb->function_pending_time;
627		break;
628	case cmb_device_disconnect_time:
629		val = cmb->device_disconnect_time;
630		break;
631	case cmb_control_unit_queuing_time:
632		val = cmb->control_unit_queuing_time;
633		break;
634	case cmb_device_active_only_time:
635		val = cmb->device_active_only_time;
636		break;
637	default:
638		goto out;
639	}
640	ret = time_to_avg_nsec(val, cmb->sample_count);
641out:
642	spin_unlock_irqrestore(cdev->ccwlock, flags);
643	return ret;
644}
645
646static int readall_cmb(struct ccw_device *cdev, struct cmbdata *data)
647{
648	struct cmb *cmb;
649	struct cmb_data *cmb_data;
650	u64 time;
651	unsigned long flags;
652	int ret;
653
654	ret = cmf_cmb_copy_wait(cdev);
655	if (ret < 0)
656		return ret;
657	spin_lock_irqsave(cdev->ccwlock, flags);
658	cmb_data = cdev->private->cmb;
659	if (!cmb_data) {
660		ret = -ENODEV;
661		goto out;
662	}
663	if (cmb_data->last_update == 0) {
664		ret = -EAGAIN;
665		goto out;
666	}
667	cmb = cmb_data->last_block;
668	time = cmb_data->last_update - cdev->private->cmb_start_time;
669
670	memset(data, 0, sizeof(struct cmbdata));
671
672	/* we only know values before device_busy_time */
673	data->size = offsetof(struct cmbdata, device_busy_time);
674
675	data->elapsed_time = tod_to_ns(time);
676
677	/* copy data to new structure */
678	data->ssch_rsch_count = cmb->ssch_rsch_count;
679	data->sample_count = cmb->sample_count;
680
681	/* time fields are converted to nanoseconds while copying */
682	data->device_connect_time = time_to_nsec(cmb->device_connect_time);
683	data->function_pending_time = time_to_nsec(cmb->function_pending_time);
684	data->device_disconnect_time =
685		time_to_nsec(cmb->device_disconnect_time);
686	data->control_unit_queuing_time
687		= time_to_nsec(cmb->control_unit_queuing_time);
688	data->device_active_only_time
689		= time_to_nsec(cmb->device_active_only_time);
690	ret = 0;
691out:
692	spin_unlock_irqrestore(cdev->ccwlock, flags);
693	return ret;
694}
695
696static void reset_cmb(struct ccw_device *cdev)
697{
698	cmf_generic_reset(cdev);
699}
700
701static int cmf_enabled(struct ccw_device *cdev)
702{
703	int enabled;
704
705	spin_lock_irq(cdev->ccwlock);
706	enabled = !!cdev->private->cmb;
707	spin_unlock_irq(cdev->ccwlock);
708
709	return enabled;
710}
711
712static struct attribute_group cmf_attr_group;
713
714static struct cmb_operations cmbops_basic = {
715	.alloc	= alloc_cmb,
716	.free	= free_cmb,
717	.set	= set_cmb,
718	.read	= read_cmb,
719	.readall    = readall_cmb,
720	.reset	    = reset_cmb,
721	.attr_group = &cmf_attr_group,
722};
723
724/* ******** extended cmb handling ********/
725
726/**
727 * struct cmbe - extended channel measurement block
728 * @ssch_rsch_count: number of ssch and rsch
729 * @sample_count: number of samples
730 * @device_connect_time: time of device connect
731 * @function_pending_time: time of function pending
732 * @device_disconnect_time: time of device disconnect
733 * @control_unit_queuing_time: time of control unit queuing
734 * @device_active_only_time: time of device active only
735 * @device_busy_time: time of device busy
736 * @initial_command_response_time: initial command response time
737 * @reserved: unused
738 *
739 * The measurement block as used by the hardware. May be in any 64 bit physical
740 * location.
741 * The fields are described further in z/Architecture Principles of Operation,
742 * third edition, chapter 17.
743 */
744struct cmbe {
745	u32 ssch_rsch_count;
746	u32 sample_count;
747	u32 device_connect_time;
748	u32 function_pending_time;
749	u32 device_disconnect_time;
750	u32 control_unit_queuing_time;
751	u32 device_active_only_time;
752	u32 device_busy_time;
753	u32 initial_command_response_time;
754	u32 reserved[7];
755} __packed __aligned(64);
756
757static struct kmem_cache *cmbe_cache;
758
759static int alloc_cmbe(struct ccw_device *cdev)
760{
761	struct cmb_data *cmb_data;
762	struct cmbe *cmbe;
763	int ret = -ENOMEM;
764
765	cmbe = kmem_cache_zalloc(cmbe_cache, GFP_KERNEL);
766	if (!cmbe)
767		return ret;
768
769	cmb_data = kzalloc(sizeof(*cmb_data), GFP_KERNEL);
770	if (!cmb_data)
771		goto out_free;
772
773	cmb_data->last_block = kzalloc(sizeof(struct cmbe), GFP_KERNEL);
774	if (!cmb_data->last_block)
775		goto out_free;
776
777	cmb_data->size = sizeof(*cmbe);
778	cmb_data->hw_block = cmbe;
779
780	spin_lock(&cmb_area.lock);
781	spin_lock_irq(cdev->ccwlock);
782	if (cdev->private->cmb)
783		goto out_unlock;
784
785	cdev->private->cmb = cmb_data;
786
787	/* activate global measurement if this is the first channel */
788	if (list_empty(&cmb_area.list))
789		cmf_activate(NULL, CMF_ON);
790	list_add_tail(&cdev->private->cmb_list, &cmb_area.list);
791
792	spin_unlock_irq(cdev->ccwlock);
793	spin_unlock(&cmb_area.lock);
794	return 0;
795
796out_unlock:
797	spin_unlock_irq(cdev->ccwlock);
798	spin_unlock(&cmb_area.lock);
799	ret = -EBUSY;
800out_free:
801	if (cmb_data)
802		kfree(cmb_data->last_block);
803	kfree(cmb_data);
804	kmem_cache_free(cmbe_cache, cmbe);
805
806	return ret;
807}
808
809static void free_cmbe(struct ccw_device *cdev)
810{
811	struct cmb_data *cmb_data;
812
813	spin_lock(&cmb_area.lock);
814	spin_lock_irq(cdev->ccwlock);
815	cmb_data = cdev->private->cmb;
816	cdev->private->cmb = NULL;
817	if (cmb_data) {
818		kfree(cmb_data->last_block);
819		kmem_cache_free(cmbe_cache, cmb_data->hw_block);
820	}
821	kfree(cmb_data);
822
823	/* deactivate global measurement if this is the last channel */
824	list_del_init(&cdev->private->cmb_list);
825	if (list_empty(&cmb_area.list))
826		cmf_activate(NULL, CMF_OFF);
827	spin_unlock_irq(cdev->ccwlock);
828	spin_unlock(&cmb_area.lock);
829}
830
831static int set_cmbe(struct ccw_device *cdev, u32 mme)
832{
833	unsigned long mba;
834	struct cmb_data *cmb_data;
835	unsigned long flags;
836
837	spin_lock_irqsave(cdev->ccwlock, flags);
838	if (!cdev->private->cmb) {
839		spin_unlock_irqrestore(cdev->ccwlock, flags);
840		return -EINVAL;
841	}
842	cmb_data = cdev->private->cmb;
843	mba = mme ? (unsigned long) cmb_data->hw_block : 0;
844	spin_unlock_irqrestore(cdev->ccwlock, flags);
845
846	return set_schib_wait(cdev, mme, 1, mba);
847}
848
849static u64 read_cmbe(struct ccw_device *cdev, int index)
850{
851	struct cmb_data *cmb_data;
852	unsigned long flags;
853	struct cmbe *cmb;
854	u64 ret = 0;
855	u32 val;
856
857	spin_lock_irqsave(cdev->ccwlock, flags);
858	cmb_data = cdev->private->cmb;
859	if (!cmb_data)
860		goto out;
861
862	cmb = cmb_data->hw_block;
863	switch (index) {
864	case avg_utilization:
865		ret = __cmb_utilization(cmb->device_connect_time,
866					cmb->function_pending_time,
867					cmb->device_disconnect_time,
868					cdev->private->cmb_start_time);
869		goto out;
870	case cmb_ssch_rsch_count:
871		ret = cmb->ssch_rsch_count;
872		goto out;
873	case cmb_sample_count:
874		ret = cmb->sample_count;
875		goto out;
876	case cmb_device_connect_time:
877		val = cmb->device_connect_time;
878		break;
879	case cmb_function_pending_time:
880		val = cmb->function_pending_time;
881		break;
882	case cmb_device_disconnect_time:
883		val = cmb->device_disconnect_time;
884		break;
885	case cmb_control_unit_queuing_time:
886		val = cmb->control_unit_queuing_time;
887		break;
888	case cmb_device_active_only_time:
889		val = cmb->device_active_only_time;
890		break;
891	case cmb_device_busy_time:
892		val = cmb->device_busy_time;
893		break;
894	case cmb_initial_command_response_time:
895		val = cmb->initial_command_response_time;
896		break;
897	default:
898		goto out;
899	}
900	ret = time_to_avg_nsec(val, cmb->sample_count);
901out:
902	spin_unlock_irqrestore(cdev->ccwlock, flags);
903	return ret;
904}
905
906static int readall_cmbe(struct ccw_device *cdev, struct cmbdata *data)
907{
908	struct cmbe *cmb;
909	struct cmb_data *cmb_data;
910	u64 time;
911	unsigned long flags;
912	int ret;
913
914	ret = cmf_cmb_copy_wait(cdev);
915	if (ret < 0)
916		return ret;
917	spin_lock_irqsave(cdev->ccwlock, flags);
918	cmb_data = cdev->private->cmb;
919	if (!cmb_data) {
920		ret = -ENODEV;
921		goto out;
922	}
923	if (cmb_data->last_update == 0) {
924		ret = -EAGAIN;
925		goto out;
926	}
927	time = cmb_data->last_update - cdev->private->cmb_start_time;
928
929	memset (data, 0, sizeof(struct cmbdata));
930
931	/* we only know values before device_busy_time */
932	data->size = offsetof(struct cmbdata, device_busy_time);
933
934	data->elapsed_time = tod_to_ns(time);
935
936	cmb = cmb_data->last_block;
937	/* copy data to new structure */
938	data->ssch_rsch_count = cmb->ssch_rsch_count;
939	data->sample_count = cmb->sample_count;
940
941	/* time fields are converted to nanoseconds while copying */
942	data->device_connect_time = time_to_nsec(cmb->device_connect_time);
943	data->function_pending_time = time_to_nsec(cmb->function_pending_time);
944	data->device_disconnect_time =
945		time_to_nsec(cmb->device_disconnect_time);
946	data->control_unit_queuing_time
947		= time_to_nsec(cmb->control_unit_queuing_time);
948	data->device_active_only_time
949		= time_to_nsec(cmb->device_active_only_time);
950	data->device_busy_time = time_to_nsec(cmb->device_busy_time);
951	data->initial_command_response_time
952		= time_to_nsec(cmb->initial_command_response_time);
953
954	ret = 0;
955out:
956	spin_unlock_irqrestore(cdev->ccwlock, flags);
957	return ret;
958}
959
960static void reset_cmbe(struct ccw_device *cdev)
961{
962	cmf_generic_reset(cdev);
963}
964
965static struct attribute_group cmf_attr_group_ext;
966
967static struct cmb_operations cmbops_extended = {
968	.alloc	    = alloc_cmbe,
969	.free	    = free_cmbe,
970	.set	    = set_cmbe,
971	.read	    = read_cmbe,
972	.readall    = readall_cmbe,
973	.reset	    = reset_cmbe,
974	.attr_group = &cmf_attr_group_ext,
975};
976
977static ssize_t cmb_show_attr(struct device *dev, char *buf, enum cmb_index idx)
978{
979	return sprintf(buf, "%lld\n",
980		(unsigned long long) cmf_read(to_ccwdev(dev), idx));
981}
982
983static ssize_t cmb_show_avg_sample_interval(struct device *dev,
984					    struct device_attribute *attr,
985					    char *buf)
986{
987	struct ccw_device *cdev = to_ccwdev(dev);
988	unsigned long count;
989	long interval;
990
991	count = cmf_read(cdev, cmb_sample_count);
992	spin_lock_irq(cdev->ccwlock);
993	if (count) {
994		interval = get_tod_clock() - cdev->private->cmb_start_time;
995		interval = tod_to_ns(interval);
996		interval /= count;
997	} else
998		interval = -1;
999	spin_unlock_irq(cdev->ccwlock);
1000	return sprintf(buf, "%ld\n", interval);
1001}
1002
1003static ssize_t cmb_show_avg_utilization(struct device *dev,
1004					struct device_attribute *attr,
1005					char *buf)
1006{
1007	unsigned long u = cmf_read(to_ccwdev(dev), avg_utilization);
1008
1009	return sprintf(buf, "%02lu.%01lu%%\n", u / 10, u % 10);
1010}
1011
1012#define cmf_attr(name) \
1013static ssize_t show_##name(struct device *dev, \
1014			   struct device_attribute *attr, char *buf)	\
1015{ return cmb_show_attr((dev), buf, cmb_##name); } \
1016static DEVICE_ATTR(name, 0444, show_##name, NULL);
1017
1018#define cmf_attr_avg(name) \
1019static ssize_t show_avg_##name(struct device *dev, \
1020			       struct device_attribute *attr, char *buf) \
1021{ return cmb_show_attr((dev), buf, cmb_##name); } \
1022static DEVICE_ATTR(avg_##name, 0444, show_avg_##name, NULL);
1023
1024cmf_attr(ssch_rsch_count);
1025cmf_attr(sample_count);
1026cmf_attr_avg(device_connect_time);
1027cmf_attr_avg(function_pending_time);
1028cmf_attr_avg(device_disconnect_time);
1029cmf_attr_avg(control_unit_queuing_time);
1030cmf_attr_avg(device_active_only_time);
1031cmf_attr_avg(device_busy_time);
1032cmf_attr_avg(initial_command_response_time);
1033
1034static DEVICE_ATTR(avg_sample_interval, 0444, cmb_show_avg_sample_interval,
1035		   NULL);
1036static DEVICE_ATTR(avg_utilization, 0444, cmb_show_avg_utilization, NULL);
1037
1038static struct attribute *cmf_attributes[] = {
1039	&dev_attr_avg_sample_interval.attr,
1040	&dev_attr_avg_utilization.attr,
1041	&dev_attr_ssch_rsch_count.attr,
1042	&dev_attr_sample_count.attr,
1043	&dev_attr_avg_device_connect_time.attr,
1044	&dev_attr_avg_function_pending_time.attr,
1045	&dev_attr_avg_device_disconnect_time.attr,
1046	&dev_attr_avg_control_unit_queuing_time.attr,
1047	&dev_attr_avg_device_active_only_time.attr,
1048	NULL,
1049};
1050
1051static struct attribute_group cmf_attr_group = {
1052	.name  = "cmf",
1053	.attrs = cmf_attributes,
1054};
1055
1056static struct attribute *cmf_attributes_ext[] = {
1057	&dev_attr_avg_sample_interval.attr,
1058	&dev_attr_avg_utilization.attr,
1059	&dev_attr_ssch_rsch_count.attr,
1060	&dev_attr_sample_count.attr,
1061	&dev_attr_avg_device_connect_time.attr,
1062	&dev_attr_avg_function_pending_time.attr,
1063	&dev_attr_avg_device_disconnect_time.attr,
1064	&dev_attr_avg_control_unit_queuing_time.attr,
1065	&dev_attr_avg_device_active_only_time.attr,
1066	&dev_attr_avg_device_busy_time.attr,
1067	&dev_attr_avg_initial_command_response_time.attr,
1068	NULL,
1069};
1070
1071static struct attribute_group cmf_attr_group_ext = {
1072	.name  = "cmf",
1073	.attrs = cmf_attributes_ext,
1074};
1075
1076static ssize_t cmb_enable_show(struct device *dev,
1077			       struct device_attribute *attr,
1078			       char *buf)
1079{
1080	struct ccw_device *cdev = to_ccwdev(dev);
1081
1082	return sprintf(buf, "%d\n", cmf_enabled(cdev));
1083}
1084
1085static ssize_t cmb_enable_store(struct device *dev,
1086				struct device_attribute *attr, const char *buf,
1087				size_t c)
1088{
1089	struct ccw_device *cdev = to_ccwdev(dev);
1090	unsigned long val;
1091	int ret;
1092
1093	ret = kstrtoul(buf, 16, &val);
1094	if (ret)
1095		return ret;
1096
1097	switch (val) {
1098	case 0:
1099		ret = disable_cmf(cdev);
1100		break;
1101	case 1:
1102		ret = enable_cmf(cdev);
1103		break;
1104	default:
1105		ret = -EINVAL;
1106	}
1107
1108	return ret ? ret : c;
1109}
1110DEVICE_ATTR_RW(cmb_enable);
1111
1112int ccw_set_cmf(struct ccw_device *cdev, int enable)
1113{
1114	return cmbops->set(cdev, enable ? 2 : 0);
1115}
1116
1117/**
1118 * enable_cmf() - switch on the channel measurement for a specific device
1119 *  @cdev:	The ccw device to be enabled
1120 *
1121 *  Enable channel measurements for @cdev. If this is called on a device
1122 *  for which channel measurement is already enabled a reset of the
1123 *  measurement data is triggered.
1124 *  Returns: %0 for success or a negative error value.
1125 *  Context:
1126 *    non-atomic
1127 */
1128int enable_cmf(struct ccw_device *cdev)
1129{
1130	int ret = 0;
1131
1132	device_lock(&cdev->dev);
1133	if (cmf_enabled(cdev)) {
1134		cmbops->reset(cdev);
1135		goto out_unlock;
1136	}
1137	get_device(&cdev->dev);
1138	ret = cmbops->alloc(cdev);
1139	if (ret)
1140		goto out;
1141	cmbops->reset(cdev);
1142	ret = sysfs_create_group(&cdev->dev.kobj, cmbops->attr_group);
1143	if (ret) {
1144		cmbops->free(cdev);
1145		goto out;
1146	}
1147	ret = cmbops->set(cdev, 2);
1148	if (ret) {
1149		sysfs_remove_group(&cdev->dev.kobj, cmbops->attr_group);
1150		cmbops->free(cdev);
1151	}
1152out:
1153	if (ret)
1154		put_device(&cdev->dev);
1155out_unlock:
1156	device_unlock(&cdev->dev);
1157	return ret;
1158}
1159
1160/**
1161 * __disable_cmf() - switch off the channel measurement for a specific device
1162 *  @cdev:	The ccw device to be disabled
1163 *
1164 *  Returns: %0 for success or a negative error value.
1165 *
1166 *  Context:
1167 *    non-atomic, device_lock() held.
1168 */
1169int __disable_cmf(struct ccw_device *cdev)
1170{
1171	int ret;
1172
1173	ret = cmbops->set(cdev, 0);
1174	if (ret)
1175		return ret;
1176
1177	sysfs_remove_group(&cdev->dev.kobj, cmbops->attr_group);
1178	cmbops->free(cdev);
1179	put_device(&cdev->dev);
1180
1181	return ret;
1182}
1183
1184/**
1185 * disable_cmf() - switch off the channel measurement for a specific device
1186 *  @cdev:	The ccw device to be disabled
1187 *
1188 *  Returns: %0 for success or a negative error value.
1189 *
1190 *  Context:
1191 *    non-atomic
1192 */
1193int disable_cmf(struct ccw_device *cdev)
1194{
1195	int ret;
1196
1197	device_lock(&cdev->dev);
1198	ret = __disable_cmf(cdev);
1199	device_unlock(&cdev->dev);
1200
1201	return ret;
1202}
1203
1204/**
1205 * cmf_read() - read one value from the current channel measurement block
1206 * @cdev:	the channel to be read
1207 * @index:	the index of the value to be read
1208 *
1209 * Returns: The value read or %0 if the value cannot be read.
1210 *
1211 *  Context:
1212 *    any
1213 */
1214u64 cmf_read(struct ccw_device *cdev, int index)
1215{
1216	return cmbops->read(cdev, index);
1217}
1218
1219/**
1220 * cmf_readall() - read the current channel measurement block
1221 * @cdev:	the channel to be read
1222 * @data:	a pointer to a data block that will be filled
1223 *
1224 * Returns: %0 on success, a negative error value otherwise.
1225 *
1226 *  Context:
1227 *    any
1228 */
1229int cmf_readall(struct ccw_device *cdev, struct cmbdata *data)
1230{
1231	return cmbops->readall(cdev, data);
1232}
1233
1234/* Reenable cmf when a disconnected device becomes available again. */
1235int cmf_reenable(struct ccw_device *cdev)
1236{
1237	cmbops->reset(cdev);
1238	return cmbops->set(cdev, 2);
1239}
1240
1241/**
1242 * cmf_reactivate() - reactivate measurement block updates
1243 *
1244 * Use this during resume from hibernate.
1245 */
1246void cmf_reactivate(void)
1247{
1248	spin_lock(&cmb_area.lock);
1249	if (!list_empty(&cmb_area.list))
1250		cmf_activate(cmb_area.mem, CMF_ON);
1251	spin_unlock(&cmb_area.lock);
1252}
1253
1254static int __init init_cmbe(void)
1255{
1256	cmbe_cache = kmem_cache_create("cmbe_cache", sizeof(struct cmbe),
1257				       __alignof__(struct cmbe), 0, NULL);
1258
1259	return cmbe_cache ? 0 : -ENOMEM;
1260}
1261
1262static int __init init_cmf(void)
1263{
1264	char *format_string;
1265	char *detect_string;
1266	int ret;
1267
1268	/*
1269	 * If the user did not give a parameter, see if we are running on a
1270	 * machine supporting extended measurement blocks, otherwise fall back
1271	 * to basic mode.
1272	 */
1273	if (format == CMF_AUTODETECT) {
1274		if (!css_general_characteristics.ext_mb) {
1275			format = CMF_BASIC;
1276		} else {
1277			format = CMF_EXTENDED;
1278		}
1279		detect_string = "autodetected";
1280	} else {
1281		detect_string = "parameter";
1282	}
1283
1284	switch (format) {
1285	case CMF_BASIC:
1286		format_string = "basic";
1287		cmbops = &cmbops_basic;
1288		break;
1289	case CMF_EXTENDED:
1290		format_string = "extended";
1291		cmbops = &cmbops_extended;
1292
1293		ret = init_cmbe();
1294		if (ret)
1295			return ret;
1296		break;
1297	default:
1298		return -EINVAL;
1299	}
1300	pr_info("Channel measurement facility initialized using format "
1301		"%s (mode %s)\n", format_string, detect_string);
1302	return 0;
1303}
1304device_initcall(init_cmf);
1305
1306EXPORT_SYMBOL_GPL(enable_cmf);
1307EXPORT_SYMBOL_GPL(disable_cmf);
1308EXPORT_SYMBOL_GPL(cmf_read);
1309EXPORT_SYMBOL_GPL(cmf_readall);
1310