2 #define TRACE_SYSTEM writeback
4 #if !defined(_TRACE_WRITEBACK_H) || defined(TRACE_HEADER_MULTI_READ)
5 #define _TRACE_WRITEBACK_H
7 #include <linux/tracepoint.h>
8 #include <linux/backing-dev.h>
9 #include <linux/writeback.h>
/*
 * show_inode_state(state): hand @state to __print_flags() together with a
 * table pairing inode I_* flag values with their names; "|" is passed as the
 * delimiter argument.
 */
11 #define show_inode_state(state) \
12 __print_flags(state, "|", \
13 {I_DIRTY_SYNC, "I_DIRTY_SYNC"}, \
14 {I_DIRTY_DATASYNC, "I_DIRTY_DATASYNC"}, \
15 {I_DIRTY_PAGES, "I_DIRTY_PAGES"}, \
17 {I_WILL_FREE, "I_WILL_FREE"}, \
18 {I_FREEING, "I_FREEING"}, \
19 {I_CLEAR, "I_CLEAR"}, \
21 {I_DIRTY_TIME, "I_DIRTY_TIME"}, \
22 {I_DIRTY_TIME_EXPIRED, "I_DIRTY_TIME_EXPIRED"}, \
23 {I_REFERENCED, "I_REFERENCED"} \
/*
 * EM()/EMe() are defined twice around WB_WORK_REASON: the first pair turns
 * each entry into TRACE_DEFINE_ENUM(a); the second pair turns each entry into
 * an { a, b } initializer, with EMe() (used for the last entry) omitting the
 * trailing comma.
 */
26 /* enums need to be exported to user space */
29 #define EM(a,b) TRACE_DEFINE_ENUM(a);
30 #define EMe(a,b) TRACE_DEFINE_ENUM(a);
/* Writeback reason enum values, each paired with the string used for it. */
32 #define WB_WORK_REASON \
33 EM( WB_REASON_BACKGROUND, "background") \
34 EM( WB_REASON_TRY_TO_FREE_PAGES, "try_to_free_pages") \
35 EM( WB_REASON_SYNC, "sync") \
36 EM( WB_REASON_PERIODIC, "periodic") \
37 EM( WB_REASON_LAPTOP_TIMER, "laptop_timer") \
38 EM( WB_REASON_FREE_MORE_MEM, "free_more_memory") \
39 EM( WB_REASON_FS_FREE_SPACE, "fs_free_space") \
40 EMe(WB_REASON_FORKER_THREAD, "forker_thread")
45 * Now redefine the EM() and EMe() macros to map the enums to the strings
46 * that will be printed in the output.
50 #define EM(a,b) { a, b },
51 #define EMe(a,b) { a, b }
53 struct wb_writeback_work;
/*
 * writeback_dirty_page: takes a page and its address_space. Records a
 * 32-byte bdi name, the host inode number and the page index.
 */
55 TRACE_EVENT(writeback_dirty_page,
57 TP_PROTO(struct page *page, struct address_space *mapping),
59 TP_ARGS(page, mapping),
62 __array(char, name, 32)
63 __field(unsigned long, ino)
64 __field(pgoff_t, index)
68 strscpy_pad(__entry->name,
69 bdi_dev_name(mapping ? inode_to_bdi(mapping->host) :
/* a NULL mapping is tolerated: ino is then recorded as 0 */
71 __entry->ino = mapping ? mapping->host->i_ino : 0;
72 __entry->index = page->index;
75 TP_printk("bdi %s: ino=%lu index=%lu",
/*
 * Event class for the dirty-inode tracepoints: takes an inode and an int
 * flags value. Records the bdi name, inode number, inode->i_state and the
 * flags argument; both state and flags are printed via show_inode_state().
 */
82 DECLARE_EVENT_CLASS(writeback_dirty_inode_template,
84 TP_PROTO(struct inode *inode, int flags),
86 TP_ARGS(inode, flags),
89 __array(char, name, 32)
90 __field(unsigned long, ino)
91 __field(unsigned long, state)
92 __field(unsigned long, flags)
96 struct backing_dev_info *bdi = inode_to_bdi(inode);
98 /* may be called for files on pseudo FSes w/ unregistered bdi */
99 strscpy_pad(__entry->name, bdi_dev_name(bdi), 32);
100 __entry->ino = inode->i_ino;
101 __entry->state = inode->i_state;
102 __entry->flags = flags;
105 TP_printk("bdi %s: ino=%lu state=%s flags=%s",
108 show_inode_state(__entry->state),
109 show_inode_state(__entry->flags)
/* writeback_mark_inode_dirty: instance of writeback_dirty_inode_template. */
113 DEFINE_EVENT(writeback_dirty_inode_template, writeback_mark_inode_dirty,
115 TP_PROTO(struct inode *inode, int flags),
117 TP_ARGS(inode, flags)
/* writeback_dirty_inode_start: instance of writeback_dirty_inode_template. */
120 DEFINE_EVENT(writeback_dirty_inode_template, writeback_dirty_inode_start,
122 TP_PROTO(struct inode *inode, int flags),
124 TP_ARGS(inode, flags)
/* writeback_dirty_inode: instance of writeback_dirty_inode_template. */
127 DEFINE_EVENT(writeback_dirty_inode_template, writeback_dirty_inode,
129 TP_PROTO(struct inode *inode, int flags),
131 TP_ARGS(inode, flags)
134 #ifdef CREATE_TRACE_POINTS
135 #ifdef CONFIG_CGROUP_WRITEBACK
/*
 * Buffer size for the cgroup path of @wb's memcg css: kernfs_path_len() of
 * the cgroup's kernfs node plus one (presumably for the terminating NUL).
 */
137 static inline size_t __trace_wb_cgroup_size(struct bdi_writeback *wb)
139 return kernfs_path_len(wb->memcg_css->cgroup->kn) + 1;
/*
 * Write the path of @wb's memcg cgroup into @buf with cgroup_path(), passing
 * kernfs_path_len() + 1 as the buffer length. Warns once if the pointer
 * returned by cgroup_path() is not @buf.
 */
142 static inline void __trace_wb_assign_cgroup(char *buf, struct bdi_writeback *wb)
144 struct cgroup *cgrp = wb->memcg_css->cgroup;
147 path = cgroup_path(cgrp, buf, kernfs_path_len(cgrp->kn) + 1);
148 WARN_ON_ONCE(path != buf);
/* writeback_control flavour: forwards wbc->wb to __trace_wb_cgroup_size(). */
151 static inline size_t __trace_wbc_cgroup_size(struct writeback_control *wbc)
154 return __trace_wb_cgroup_size(wbc->wb);
/* writeback_control flavour: forwards @buf and wbc->wb to __trace_wb_assign_cgroup(). */
159 static inline void __trace_wbc_assign_cgroup(char *buf,
160 struct writeback_control *wbc)
163 __trace_wb_assign_cgroup(buf, wbc->wb);
168 #else /* CONFIG_CGROUP_WRITEBACK */
/* Variant of __trace_wb_cgroup_size() used when CONFIG_CGROUP_WRITEBACK is not set. */
170 static inline size_t __trace_wb_cgroup_size(struct bdi_writeback *wb)
/* Variant of __trace_wb_assign_cgroup() used when CONFIG_CGROUP_WRITEBACK is not set. */
175 static inline void __trace_wb_assign_cgroup(char *buf, struct bdi_writeback *wb)
/* Variant of __trace_wbc_cgroup_size() used when CONFIG_CGROUP_WRITEBACK is not set. */
180 static inline size_t __trace_wbc_cgroup_size(struct writeback_control *wbc)
/* Variant of __trace_wbc_assign_cgroup() used when CONFIG_CGROUP_WRITEBACK is not set. */
185 static inline void __trace_wbc_assign_cgroup(char *buf,
186 struct writeback_control *wbc)
191 #endif /* CONFIG_CGROUP_WRITEBACK */
192 #endif /* CREATE_TRACE_POINTS */
/*
 * Event class for the write-inode tracepoints: takes an inode and a
 * writeback_control. Records the bdi name, inode number, wbc->sync_mode and
 * a cgroup path string sized by __trace_wbc_cgroup_size().
 */
194 DECLARE_EVENT_CLASS(writeback_write_inode_template,
196 TP_PROTO(struct inode *inode, struct writeback_control *wbc),
201 __array(char, name, 32)
202 __field(unsigned long, ino)
203 __field(int, sync_mode)
204 __dynamic_array(char, cgroup, __trace_wbc_cgroup_size(wbc))
208 strscpy_pad(__entry->name,
209 bdi_dev_name(inode_to_bdi(inode)), 32);
210 __entry->ino = inode->i_ino;
211 __entry->sync_mode = wbc->sync_mode;
212 __trace_wbc_assign_cgroup(__get_str(cgroup), wbc);
215 TP_printk("bdi %s: ino=%lu sync_mode=%d cgroup=%s",
/* writeback_write_inode_start: instance of writeback_write_inode_template. */
223 DEFINE_EVENT(writeback_write_inode_template, writeback_write_inode_start,
225 TP_PROTO(struct inode *inode, struct writeback_control *wbc),
/* writeback_write_inode: instance of writeback_write_inode_template. */
230 DEFINE_EVENT(writeback_write_inode_template, writeback_write_inode,
232 TP_PROTO(struct inode *inode, struct writeback_control *wbc),
/*
 * Event class for wb_writeback_work events: takes a bdi_writeback and a work
 * item. Copies the work item's nr_pages, sync_mode, for_kupdate,
 * range_cyclic, for_background and reason, plus the bdi name and the wb's
 * cgroup path. The reason is printed symbolically through WB_WORK_REASON.
 */
237 DECLARE_EVENT_CLASS(writeback_work_class,
238 TP_PROTO(struct bdi_writeback *wb, struct wb_writeback_work *work),
241 __array(char, name, 32)
242 __field(long, nr_pages)
243 __field(dev_t, sb_dev)
244 __field(int, sync_mode)
245 __field(int, for_kupdate)
246 __field(int, range_cyclic)
247 __field(int, for_background)
249 __dynamic_array(char, cgroup, __trace_wb_cgroup_size(wb))
252 strscpy_pad(__entry->name, bdi_dev_name(wb->bdi), 32);
253 __entry->nr_pages = work->nr_pages;
/* work->sb may be NULL; sb_dev is then recorded as 0 */
254 __entry->sb_dev = work->sb ? work->sb->s_dev : 0;
255 __entry->sync_mode = work->sync_mode;
256 __entry->for_kupdate = work->for_kupdate;
257 __entry->range_cyclic = work->range_cyclic;
258 __entry->for_background = work->for_background;
259 __entry->reason = work->reason;
260 __trace_wb_assign_cgroup(__get_str(cgroup), wb);
262 TP_printk("bdi %s: sb_dev %d:%d nr_pages=%ld sync_mode=%d "
263 "kupdate=%d range_cyclic=%d background=%d reason=%s cgroup=%s",
265 MAJOR(__entry->sb_dev), MINOR(__entry->sb_dev),
268 __entry->for_kupdate,
269 __entry->range_cyclic,
270 __entry->for_background,
271 __print_symbolic(__entry->reason, WB_WORK_REASON),
/*
 * DEFINE_WRITEBACK_WORK_EVENT(name): shorthand that instantiates
 * writeback_work_class as tracepoint @name; used below for the queue, exec,
 * start, written and wait events.
 */
275 #define DEFINE_WRITEBACK_WORK_EVENT(name) \
276 DEFINE_EVENT(writeback_work_class, name, \
277 TP_PROTO(struct bdi_writeback *wb, struct wb_writeback_work *work), \
279 DEFINE_WRITEBACK_WORK_EVENT(writeback_queue);
280 DEFINE_WRITEBACK_WORK_EVENT(writeback_exec);
281 DEFINE_WRITEBACK_WORK_EVENT(writeback_start);
282 DEFINE_WRITEBACK_WORK_EVENT(writeback_written);
283 DEFINE_WRITEBACK_WORK_EVENT(writeback_wait);
/* writeback_pages_written: records the pages_written argument and prints it as a bare "%ld". */
285 TRACE_EVENT(writeback_pages_written,
286 TP_PROTO(long pages_written),
287 TP_ARGS(pages_written),
292 __entry->pages = pages_written;
294 TP_printk("%ld", __entry->pages)
/*
 * Event class taking only a bdi_writeback: records the bdi name and the
 * wb's cgroup path.
 */
297 DECLARE_EVENT_CLASS(writeback_class,
298 TP_PROTO(struct bdi_writeback *wb),
301 __array(char, name, 32)
302 __dynamic_array(char, cgroup, __trace_wb_cgroup_size(wb))
305 strscpy_pad(__entry->name, bdi_dev_name(wb->bdi), 32);
306 __trace_wb_assign_cgroup(__get_str(cgroup), wb);
308 TP_printk("bdi %s: cgroup=%s",
/*
 * DEFINE_WRITEBACK_EVENT(name): shorthand that instantiates writeback_class
 * as tracepoint @name; used below for the nowork and wake_background events.
 */
313 #define DEFINE_WRITEBACK_EVENT(name) \
314 DEFINE_EVENT(writeback_class, name, \
315 TP_PROTO(struct bdi_writeback *wb), \
318 DEFINE_WRITEBACK_EVENT(writeback_nowork);
319 DEFINE_WRITEBACK_EVENT(writeback_wake_background);
/* writeback_bdi_register: takes a backing_dev_info and records its device name (32 bytes, padded). */
321 TRACE_EVENT(writeback_bdi_register,
322 TP_PROTO(struct backing_dev_info *bdi),
325 __array(char, name, 32)
328 strscpy_pad(__entry->name, bdi_dev_name(bdi), 32);
/*
 * Event class for writeback_control snapshots: takes a wbc and a bdi.
 * Copies nr_to_write, pages_skipped, sync_mode, the for_kupdate /
 * for_background / for_reclaim / range_cyclic flags and the byte range from
 * @wbc, plus the bdi name and the wbc's cgroup path.
 */
335 DECLARE_EVENT_CLASS(wbc_class,
336 TP_PROTO(struct writeback_control *wbc, struct backing_dev_info *bdi),
339 __array(char, name, 32)
340 __field(long, nr_to_write)
341 __field(long, pages_skipped)
342 __field(int, sync_mode)
343 __field(int, for_kupdate)
344 __field(int, for_background)
345 __field(int, for_reclaim)
346 __field(int, range_cyclic)
347 __field(long, range_start)
348 __field(long, range_end)
349 __dynamic_array(char, cgroup, __trace_wbc_cgroup_size(wbc))
353 strscpy_pad(__entry->name, bdi_dev_name(bdi), 32);
354 __entry->nr_to_write = wbc->nr_to_write;
355 __entry->pages_skipped = wbc->pages_skipped;
356 __entry->sync_mode = wbc->sync_mode;
357 __entry->for_kupdate = wbc->for_kupdate;
358 __entry->for_background = wbc->for_background;
359 __entry->for_reclaim = wbc->for_reclaim;
360 __entry->range_cyclic = wbc->range_cyclic;
/* the range bounds are narrowed to long for storage and printed as hex */
361 __entry->range_start = (long)wbc->range_start;
362 __entry->range_end = (long)wbc->range_end;
363 __trace_wbc_assign_cgroup(__get_str(cgroup), wbc);
366 TP_printk("bdi %s: towrt=%ld skip=%ld mode=%d kupd=%d "
367 "bgrd=%d reclm=%d cyclic=%d "
368 "start=0x%lx end=0x%lx cgroup=%s",
370 __entry->nr_to_write,
371 __entry->pages_skipped,
373 __entry->for_kupdate,
374 __entry->for_background,
375 __entry->for_reclaim,
376 __entry->range_cyclic,
377 __entry->range_start,
/*
 * DEFINE_WBC_EVENT(name): shorthand that instantiates wbc_class as
 * tracepoint @name; used below for wbc_writepage.
 */
383 #define DEFINE_WBC_EVENT(name) \
384 DEFINE_EVENT(wbc_class, name, \
385 TP_PROTO(struct writeback_control *wbc, struct backing_dev_info *bdi), \
387 DEFINE_WBC_EVENT(wbc_writepage);
/*
 * writeback_queue_io: records the bdi name, the dirtied_before cutoff (in
 * jiffies), its age relative to the current jiffies in milliseconds, the
 * moved count, the work item's reason and the wb's cgroup path.
 */
389 TRACE_EVENT(writeback_queue_io,
390 TP_PROTO(struct bdi_writeback *wb,
391 struct wb_writeback_work *work,
392 unsigned long dirtied_before,
394 TP_ARGS(wb, work, dirtied_before, moved),
396 __array(char, name, 32)
397 __field(unsigned long, older)
401 __dynamic_array(char, cgroup, __trace_wb_cgroup_size(wb))
404 strscpy_pad(__entry->name, bdi_dev_name(wb->bdi), 32);
405 __entry->older = dirtied_before;
/* jiffies delta scaled by 1000 / HZ, i.e. milliseconds */
406 __entry->age = (jiffies - dirtied_before) * 1000 / HZ;
407 __entry->moved = moved;
408 __entry->reason = work->reason;
409 __trace_wb_assign_cgroup(__get_str(cgroup), wb);
411 TP_printk("bdi %s: older=%lu age=%ld enqueue=%d reason=%s cgroup=%s",
413 __entry->older, /* dirtied_before in jiffies */
414 __entry->age, /* dirtied_before in relative milliseconds */
416 __print_symbolic(__entry->reason, WB_WORK_REASON),
/*
 * global_dirty_state: snapshot of global page counters read through
 * global_page_state() (dirty, writeback, unstable NFS, dirtied, written),
 * together with the background/dirty thresholds passed in and
 * global_wb_domain.dirty_limit.
 */
421 TRACE_EVENT(global_dirty_state,
423 TP_PROTO(unsigned long background_thresh,
424 unsigned long dirty_thresh
427 TP_ARGS(background_thresh,
432 __field(unsigned long, nr_dirty)
433 __field(unsigned long, nr_writeback)
434 __field(unsigned long, nr_unstable)
435 __field(unsigned long, background_thresh)
436 __field(unsigned long, dirty_thresh)
437 __field(unsigned long, dirty_limit)
438 __field(unsigned long, nr_dirtied)
439 __field(unsigned long, nr_written)
443 __entry->nr_dirty = global_page_state(NR_FILE_DIRTY);
444 __entry->nr_writeback = global_page_state(NR_WRITEBACK);
445 __entry->nr_unstable = global_page_state(NR_UNSTABLE_NFS);
446 __entry->nr_dirtied = global_page_state(NR_DIRTIED);
447 __entry->nr_written = global_page_state(NR_WRITTEN);
448 __entry->background_thresh = background_thresh;
449 __entry->dirty_thresh = dirty_thresh;
450 __entry->dirty_limit = global_wb_domain.dirty_limit;
453 TP_printk("dirty=%lu writeback=%lu unstable=%lu "
454 "bg_thresh=%lu thresh=%lu limit=%lu "
455 "dirtied=%lu written=%lu",
457 __entry->nr_writeback,
458 __entry->nr_unstable,
459 __entry->background_thresh,
460 __entry->dirty_thresh,
461 __entry->dirty_limit,
/*
 * KBps(x): left-shift @x by (PAGE_SHIFT - 10), i.e. multiply by the page
 * size divided by 1024. Presumably @x is a rate in pages per second and the
 * result is in KB/s, as the name suggests -- confirm against callers.
 */
467 #define KBps(x) ((x) << (PAGE_SHIFT - 10))
/*
 * bdi_dirty_ratelimit: records the bdi name, the wb's bandwidth and
 * ratelimit values, the dirty_rate and task_ratelimit arguments, and the
 * wb's cgroup path. Every numeric field is stored after KBps() conversion.
 */
469 TRACE_EVENT(bdi_dirty_ratelimit,
471 TP_PROTO(struct bdi_writeback *wb,
472 unsigned long dirty_rate,
473 unsigned long task_ratelimit),
475 TP_ARGS(wb, dirty_rate, task_ratelimit),
478 __array(char, bdi, 32)
479 __field(unsigned long, write_bw)
480 __field(unsigned long, avg_write_bw)
481 __field(unsigned long, dirty_rate)
482 __field(unsigned long, dirty_ratelimit)
483 __field(unsigned long, task_ratelimit)
484 __field(unsigned long, balanced_dirty_ratelimit)
485 __dynamic_array(char, cgroup, __trace_wb_cgroup_size(wb))
489 strscpy_pad(__entry->bdi, bdi_dev_name(wb->bdi), 32);
490 __entry->write_bw = KBps(wb->write_bandwidth);
491 __entry->avg_write_bw = KBps(wb->avg_write_bandwidth);
492 __entry->dirty_rate = KBps(dirty_rate);
493 __entry->dirty_ratelimit = KBps(wb->dirty_ratelimit);
494 __entry->task_ratelimit = KBps(task_ratelimit);
495 __entry->balanced_dirty_ratelimit =
496 KBps(wb->balanced_dirty_ratelimit);
497 __trace_wb_assign_cgroup(__get_str(cgroup), wb);
501 "write_bw=%lu awrite_bw=%lu dirty_rate=%lu "
502 "dirty_ratelimit=%lu task_ratelimit=%lu "
503 "balanced_dirty_ratelimit=%lu cgroup=%s",
505 __entry->write_bw, /* write bandwidth */
506 __entry->avg_write_bw, /* avg write bandwidth */
507 __entry->dirty_rate, /* bdi dirty rate */
508 __entry->dirty_ratelimit, /* base ratelimit */
509 __entry->task_ratelimit, /* ratelimit with position control */
510 __entry->balanced_dirty_ratelimit, /* the balanced ratelimit */
/*
 * balance_dirty_pages: records the dirty-throttling inputs for one wb:
 * global limit and setpoint, dirty counts, per-bdi setpoint and dirty count,
 * ratelimits (converted with KBps()), the dirtied counters, and the
 * pause/period/think timings converted from jiffies to milliseconds.
 */
515 TRACE_EVENT(balance_dirty_pages,
517 TP_PROTO(struct bdi_writeback *wb,
518 unsigned long thresh,
519 unsigned long bg_thresh,
521 unsigned long bdi_thresh,
522 unsigned long bdi_dirty,
523 unsigned long dirty_ratelimit,
524 unsigned long task_ratelimit,
525 unsigned long dirtied,
526 unsigned long period,
528 unsigned long start_time),
530 TP_ARGS(wb, thresh, bg_thresh, dirty, bdi_thresh, bdi_dirty,
531 dirty_ratelimit, task_ratelimit,
532 dirtied, period, pause, start_time),
535 __array( char, bdi, 32)
536 __field(unsigned long, limit)
537 __field(unsigned long, setpoint)
538 __field(unsigned long, dirty)
539 __field(unsigned long, bdi_setpoint)
540 __field(unsigned long, bdi_dirty)
541 __field(unsigned long, dirty_ratelimit)
542 __field(unsigned long, task_ratelimit)
543 __field(unsigned int, dirtied)
544 __field(unsigned int, dirtied_pause)
545 __field(unsigned long, paused)
546 __field( long, pause)
547 __field(unsigned long, period)
548 __field( long, think)
549 __dynamic_array(char, cgroup, __trace_wb_cgroup_size(wb))
/* freerun is the midpoint between thresh and bg_thresh */
553 unsigned long freerun = (thresh + bg_thresh) / 2;
554 strscpy_pad(__entry->bdi, bdi_dev_name(wb->bdi), 32);
556 __entry->limit = global_wb_domain.dirty_limit;
557 __entry->setpoint = (global_wb_domain.dirty_limit +
559 __entry->dirty = dirty;
/* scale the global setpoint by bdi_thresh / (thresh + 1); the +1 keeps the divisor non-zero when thresh is 0 */
560 __entry->bdi_setpoint = __entry->setpoint *
561 bdi_thresh / (thresh + 1);
562 __entry->bdi_dirty = bdi_dirty;
563 __entry->dirty_ratelimit = KBps(dirty_ratelimit);
564 __entry->task_ratelimit = KBps(task_ratelimit);
565 __entry->dirtied = dirtied;
566 __entry->dirtied_pause = current->nr_dirtied_pause;
/* think is 0 when current->dirty_paused_when is 0, otherwise the elapsed jiffies in ms */
567 __entry->think = current->dirty_paused_when == 0 ? 0 :
568 (long)(jiffies - current->dirty_paused_when) * 1000/HZ;
569 __entry->period = period * 1000 / HZ;
570 __entry->pause = pause * 1000 / HZ;
571 __entry->paused = (jiffies - start_time) * 1000 / HZ;
572 __trace_wb_assign_cgroup(__get_str(cgroup), wb);
577 "limit=%lu setpoint=%lu dirty=%lu "
578 "bdi_setpoint=%lu bdi_dirty=%lu "
579 "dirty_ratelimit=%lu task_ratelimit=%lu "
580 "dirtied=%u dirtied_pause=%u "
581 "paused=%lu pause=%ld period=%lu think=%ld cgroup=%s",
586 __entry->bdi_setpoint,
588 __entry->dirty_ratelimit,
589 __entry->task_ratelimit,
591 __entry->dirtied_pause,
592 __entry->paused, /* ms */
593 __entry->pause, /* ms */
594 __entry->period, /* ms */
595 __entry->think, /* ms */
/*
 * writeback_sb_inodes_requeue: takes an inode. Records the bdi name, inode
 * number, i_state, dirtied_when and the cgroup path of inode_to_wb(inode).
 */
600 TRACE_EVENT(writeback_sb_inodes_requeue,
602 TP_PROTO(struct inode *inode),
606 __array(char, name, 32)
607 __field(unsigned long, ino)
608 __field(unsigned long, state)
609 __field(unsigned long, dirtied_when)
610 __dynamic_array(char, cgroup,
611 __trace_wb_cgroup_size(inode_to_wb(inode)))
615 strscpy_pad(__entry->name,
616 bdi_dev_name(inode_to_bdi(inode)), 32);
617 __entry->ino = inode->i_ino;
618 __entry->state = inode->i_state;
619 __entry->dirtied_when = inode->dirtied_when;
620 __trace_wb_assign_cgroup(__get_str(cgroup), inode_to_wb(inode));
623 TP_printk("bdi %s: ino=%lu state=%s dirtied_when=%lu age=%lu cgroup=%s",
626 show_inode_state(__entry->state),
627 __entry->dirtied_when,
/*
 * NOTE(review): age is derived from jiffies inside the TP_printk arguments,
 * so it is presumably computed when the event is formatted rather than when
 * it was recorded -- confirm.
 */
628 (jiffies - __entry->dirtied_when) / HZ,
/*
 * Event class for the congestion-wait tracepoints: records the two unsigned
 * int arguments usec_timeout and usec_delayed unchanged.
 */
633 DECLARE_EVENT_CLASS(writeback_congest_waited_template,
635 TP_PROTO(unsigned int usec_timeout, unsigned int usec_delayed),
637 TP_ARGS(usec_timeout, usec_delayed),
640 __field( unsigned int, usec_timeout )
641 __field( unsigned int, usec_delayed )
645 __entry->usec_timeout = usec_timeout;
646 __entry->usec_delayed = usec_delayed;
649 TP_printk("usec_timeout=%u usec_delayed=%u",
650 __entry->usec_timeout,
651 __entry->usec_delayed)
/* writeback_congestion_wait: instance of writeback_congest_waited_template. */
654 DEFINE_EVENT(writeback_congest_waited_template, writeback_congestion_wait,
656 TP_PROTO(unsigned int usec_timeout, unsigned int usec_delayed),
658 TP_ARGS(usec_timeout, usec_delayed)
/* writeback_wait_iff_congested: instance of writeback_congest_waited_template. */
661 DEFINE_EVENT(writeback_congest_waited_template, writeback_wait_iff_congested,
663 TP_PROTO(unsigned int usec_timeout, unsigned int usec_delayed),
665 TP_ARGS(usec_timeout, usec_delayed)
/*
 * Event class for the single-inode writeback tracepoints: takes an inode, a
 * writeback_control and an nr_to_write value. Records the bdi name, inode
 * number, i_state, dirtied_when, the mapping's writeback_index, nr_to_write,
 * a derived "wrote" count and the wbc's cgroup path.
 */
668 DECLARE_EVENT_CLASS(writeback_single_inode_template,
670 TP_PROTO(struct inode *inode,
671 struct writeback_control *wbc,
672 unsigned long nr_to_write
675 TP_ARGS(inode, wbc, nr_to_write),
678 __array(char, name, 32)
679 __field(unsigned long, ino)
680 __field(unsigned long, state)
681 __field(unsigned long, dirtied_when)
682 __field(unsigned long, writeback_index)
683 __field(long, nr_to_write)
684 __field(unsigned long, wrote)
685 __dynamic_array(char, cgroup, __trace_wbc_cgroup_size(wbc))
689 strscpy_pad(__entry->name,
690 bdi_dev_name(inode_to_bdi(inode)), 32);
691 __entry->ino = inode->i_ino;
692 __entry->state = inode->i_state;
693 __entry->dirtied_when = inode->dirtied_when;
694 __entry->writeback_index = inode->i_mapping->writeback_index;
695 __entry->nr_to_write = nr_to_write;
/* difference between the nr_to_write argument and what remains in wbc->nr_to_write */
696 __entry->wrote = nr_to_write - wbc->nr_to_write;
697 __trace_wbc_assign_cgroup(__get_str(cgroup), wbc);
700 TP_printk("bdi %s: ino=%lu state=%s dirtied_when=%lu age=%lu "
701 "index=%lu to_write=%ld wrote=%lu cgroup=%s",
704 show_inode_state(__entry->state),
705 __entry->dirtied_when,
706 (jiffies - __entry->dirtied_when) / HZ,
707 __entry->writeback_index,
708 __entry->nr_to_write,
/* writeback_single_inode_start: instance of writeback_single_inode_template. */
714 DEFINE_EVENT(writeback_single_inode_template, writeback_single_inode_start,
715 TP_PROTO(struct inode *inode,
716 struct writeback_control *wbc,
717 unsigned long nr_to_write),
718 TP_ARGS(inode, wbc, nr_to_write)
/* writeback_single_inode: instance of writeback_single_inode_template. */
721 DEFINE_EVENT(writeback_single_inode_template, writeback_single_inode,
722 TP_PROTO(struct inode *inode,
723 struct writeback_control *wbc,
724 unsigned long nr_to_write),
725 TP_ARGS(inode, wbc, nr_to_write)
/*
 * Event class for the lazytime tracepoints: takes an inode. Records the
 * superblock device number, inode number, i_state, i_mode and dirtied_when;
 * the device is printed as major,minor and the mode in octal.
 */
728 DECLARE_EVENT_CLASS(writeback_lazytime_template,
729 TP_PROTO(struct inode *inode),
734 __field( dev_t, dev )
735 __field(unsigned long, ino )
736 __field(unsigned long, state )
737 __field( __u16, mode )
738 __field(unsigned long, dirtied_when )
742 __entry->dev = inode->i_sb->s_dev;
743 __entry->ino = inode->i_ino;
744 __entry->state = inode->i_state;
745 __entry->mode = inode->i_mode;
746 __entry->dirtied_when = inode->dirtied_when;
749 TP_printk("dev %d,%d ino %lu dirtied %lu state %s mode 0%o",
750 MAJOR(__entry->dev), MINOR(__entry->dev),
751 __entry->ino, __entry->dirtied_when,
752 show_inode_state(__entry->state), __entry->mode)
/* writeback_lazytime: instance of writeback_lazytime_template. */
755 DEFINE_EVENT(writeback_lazytime_template, writeback_lazytime,
756 TP_PROTO(struct inode *inode),
/* writeback_lazytime_iput: instance of writeback_lazytime_template. */
761 DEFINE_EVENT(writeback_lazytime_template, writeback_lazytime_iput,
762 TP_PROTO(struct inode *inode),
/* writeback_dirty_inode_enqueue: instance of writeback_lazytime_template. */
767 DEFINE_EVENT(writeback_lazytime_template, writeback_dirty_inode_enqueue,
769 TP_PROTO(struct inode *inode),
774 #endif /* _TRACE_WRITEBACK_H */
776 /* This part must be outside protection */
777 #include <trace/define_trace.h>