mirror of
https://github.com/LineageOS/android_kernel_fxtec_sm6115.git
synced 2026-04-02 04:06:04 +00:00
version 4.19.325-cip123 * tag 'v4.19.325-cip123' of https://git.kernel.org/pub/scm/linux/kernel/git/cip/linux-cip: CIP: Bump version suffix to -cip123 after merge from cip/linux-4.19.y-st tree Update localversion-st, tree is up-to-date with 5.4.296. emulex/benet: Fix build by return mismatch in be_cmd_unlock() net/sched: Abort __tc_modify_qdisc if parent class does not exist mtk-sd: Prevent memory corruption from DMA map failure mmc: mediatek: use data instead of mrq parameter from msdc_{un}prepare_data() scsi: qla4xxx: Fix missing DMA mapping error in qla4xxx_alloc_pdu() btrfs: don't abort filesystem when attempting to snapshot deleted subvolume VMCI: fix race between vmci_host_setup_notify and vmci_ctx_unset_notify net: ipv6: Discard next-hop MTU less than minimum link MTU Input: atkbd - do not skip atkbd_deactivate() when skipping ATKBD_CMD_GETID HID: quirks: Add quirk for 2 Chicony Electronics HP 5MP Cameras HID: Add IGNORE quirk for SMARTLINKTECHNOLOGY vt: add missing notification when switching back to text mode net: usb: qmi_wwan: add SIMCom 8230C composition atm: idt77252: Add missing `dma_map_error()` bnxt_en: Fix DCB ETS validation can: m_can: m_can_handle_lost_msg(): downgrade msg lost in rx message to debug level net: appletalk: Fix device refcount leak in atrtr_create() md/raid1: Fix stack memory use after return in raid1_reshape wifi: zd1211rw: Fix potential NULL pointer dereference in zd_mac_tx_to_dev() dma-buf: fix timeout handling in dma_resv_wait_timeout v2 Input: xpad - support Acer NGR 200 Controller Input: xpad - add VID for Turtle Beach controllers Input: xpad - add support for Amazon Game Controller netlink: Fix rmem check in netlink_broadcast_deliver(). 
netlink: make sure we allow at least one dump skb Revert "ACPI: battery: negate current when discharging" usb: gadget: u_serial: Fix race condition in TTY wakeup drm/sched: Increment job count before swapping tail spsc queue x86/mce: Make sure CMCI banks are cleared during shutdown on Intel x86/mce: Don't remove sysfs if thresholding sysfs init fails x86/mce/amd: Fix threshold limit reset rxrpc: Fix oops due to non-existence of prealloc backlog struct atm: clip: Fix NULL pointer dereference in vcc_sendmsg() atm: clip: Fix infinite recursive call of clip_push(). atm: clip: Fix memory leak of struct clip_vcc. atm: clip: Fix potential null-ptr-deref in to_atmarpd(). tipc: Fix use-after-free in tipc_conn_close(). netlink: Fix wraparounds of sk->sk_rmem_alloc. fix proc_sys_compare() handling of in-lookup dentries proc: Clear the pieces of proc_inode that proc_evict_inode cares about staging: rtl8723bs: Avoid memset() in aes_cipher() and aes_decipher() media: uvcvideo: Rollback non processed entities on error media: uvcvideo: Send control events for partial succeeds media: uvcvideo: Return the number of processed controls ACPI: PAD: fix crash in exit_round_robin() usb: typec: displayport: Fix potential deadlock Logitech C-270 even more broken rose: fix dangling neighbour pointers in rose_rt_device_down() net: rose: Fix fall-through warnings for Clang ethernet: atl1: Add missing DMA mapping error checks and count errors btrfs: use btrfs_record_snapshot_destroy() during rmdir btrfs: propagate last_unlink_trans earlier when doing a rmdir RDMA/mlx5: Fix CC counters query for MPV scsi: ufs: core: Fix spelling of a sysfs attribute name ACPICA: Refuse to evaluate a method if arguments are missing wifi: ath6kl: remove WARN on bad firmware input wifi: mac80211: drop invalid source address OCB frames powerpc: Fix struct termio related ioctl macros ata: pata_cs5536: fix build on 32-bit UML ALSA: sb: Force to disable DMAs once when DMA mode is changed net/sched: Always pass 
notifications when child class becomes empty nui: Fix dma_mapping_error() check enic: fix incorrect MTU comparison in enic_change_mtu() amd-xgbe: align CL37 AN sequence as per databook btrfs: fix missing error handling when searching for inode refs during log replay mtk-sd: Fix a pagefault in dma_unmap_sg() for not prepared data usb: typec: altmodes/displayport: do not index invalid pin_assignments Revert "mmc: sdhci: Disable SD card clock before changing parameters" mmc: sdhci: Add a helper function for dump register in dynamic debug mode vsock/vmci: Clear the vmci transport packet properly when initializing it arm64: Restrict pagetable teardown to avoid false warning drm/bridge: cdns-dsi: Fix connecting to next bridge drm/tegra: Assign plane type before registration HID: wacom: fix kobject reference count leak HID: wacom: fix memory leak on sysfs attribute creation failure HID: wacom: fix memory leak on kobject creation failure dm-raid: fix variable in journal device check Bluetooth: L2CAP: Fix L2CAP MTU negotiation atm: Release atm_dev_mutex after removing procfs in atm_dev_deregister(). 
um: ubd: Add missing error check in start_io_thread() vsock/uapi: fix linux/vm_sockets.h userspace compilation errors wifi: mac80211: fix beacon interval calculation overflow ALSA: usb-audio: Fix out-of-bounds read in snd_usb_get_audioformat_uac3() i2c: robotfuzz-osif: disable zero-length read messages i2c: tiny-usb: disable zero-length read messages RDMA/iwcm: Fix use-after-free of work objects after cm_id destruction RDMA/core: Use refcount_t instead of atomic_t on refcount of iwcm_id_private media: vivid: Change the siize of the composing media: omap3isp: use sgtable-based scatterlist wrappers jfs: validate AG parameters in dbMount() to prevent crashes fs/jfs: consolidate sanity checking in dbMount VMCI: check context->notify_page after call to get_user_pages_fast() to avoid GPF ovl: Check for NULL d_inode() in ovl_dentry_upper() ceph: fix possible integer overflow in ceph_zero_objects() ALSA: hda: Ignore unsol events for cards being shut down usb: typec: displayport: Receive DP Status Update NAK request exit dp altmode usb: cdc-wdm: avoid setting WDM_READ for ZLP-s usb: Add checks for snprintf() calls in usb_alloc_dev() usb: potential integer overflow in usbg_make_tpg() iio: pressure: zpa2326: Use aligned_s64 for the timestamp md/md-bitmap: fix dm-raid max_write_behind setting dmaengine: xilinx_dma: Set dma_device directions mfd: max14577: Fix wakeup source leaks on device unbind mailbox: Not protect module_put with spin_lock_irqsave cifs: Fix cifs_query_path_info() for Windows NT servers CIP: Bump version suffix to -cip122 after merge from cip/linux-4.19.y-st tree Update localversion-st, tree is up-to-date with 5.4.295. 
ARM: dts: am335x-bone-common: Increase MDIO reset deassert delay to 50ms ARM: dts: am335x-bone-common: Increase MDIO reset deassert time ARM: dts: am335x-bone-common: Add GPIO PHY reset on revision C3 board ARM: dts: am335x-bone-common: get rid of phy_id property mtd: nand: sunxi: Add randomizer configuration before randomizer enable mtd: rawnand: sunxi: Add randomizer configuration in sunxi_nfc_hw_ecc_write_chunk sch_hfsc: Fix qlen accounting bug when using peek in hfsc_enqueue() bridge: netfilter: Fix forwarding of fragmented packets vxlan: Annotate FDB data races hwmon: (gpio-fan) Add missing mutex locks nfs: handle failure of nfs_get_lock_context in unlock path sch_htb: make htb_deactivate() idempotent scsi: qedf: Use designated initializer for struct qed_fcoe_cb_ops arm64/ptrace: Fix stack-out-of-bounds read in regs_get_kernel_stack_nth() perf: Fix sample vs do_exit() jbd2: fix data-race and null-ptr-deref in jbd2_journal_dirty_metadata() mm/huge_memory: fix dereferencing invalid pmd migration entry posix-cpu-timers: fix race between handle_posix_cpu_timers() and posix_cpu_timer_del() net: atm: fix /proc/net/atm/lec handling net: atm: add lec_mutex calipso: Fix null-ptr-deref in calipso_req_{set,del}attr(). tipc: fix null-ptr-deref when acquiring remote ip of ethernet bearer atm: atmtcp: Free invalid length skb in atmtcp_c_send(). mpls: Use rcu_dereference_rtnl() in mpls_route_input_rcu(). wifi: carl9170: do not ping device which has failed to load firmware drm/nouveau/bl: increase buffer size to avoid truncate warning ALSA: hda/realtek: enable headset mic on Latitude 5420 Rugged ALSA: hda/intel: Add Thinkpad E15 to PM deny list Input: sparcspkr - avoid unannotated fall-through HID: usbhid: Eliminate recurrent out-of-bounds bug in usbhid_parse() atm: Revert atm_account_tx() if copy_from_iter_full() fails. 
selinux: fix selinux_xfrm_alloc_user() to set correct ctx_len scsi: s390: zfcp: Ensure synchronous unit_add jffs2: check jffs2_prealloc_raw_node_refs() result in few other places jffs2: check that raw node were preallocated before writing summary drivers/rapidio/rio_cm.c: prevent possible heap overwrite Revert "x86/bugs: Make spectre user default depend on MITIGATION_SPECTRE_V2" on v6.6 and older powerpc/eeh: Fix missing PE bridge reconfiguration during VFIO EEH recovery platform/x86: dell_rbu: Stop overwriting data buffer tee: Prevent size calculation wraparound on 32-bit kernels ARM: OMAP2+: Fix l4ls clk domain handling in STANDBY bus: fsl-mc: increase MC_CMD_COMPLETION_TIMEOUT_MS value watchdog: da9052_wdt: respect TWDMIN i40e: fix MMIO write access to an invalid page in i40e_clear_hw sock: Correct error checking condition for (assign|release)_proto_idx() vxlan: Do not treat dst cache initialization errors as fatal clk: rockchip: rk3036: mark ddrphy as critical wifi: mac80211: do not offer a mesh path if forwarding is disabled net: mlx4: add SOF_TIMESTAMPING_TX_SOFTWARE flag when getting ts info pinctrl: armada-37xx: propagate error from armada_37xx_gpio_get() pinctrl: armada-37xx: propagate error from armada_37xx_pmx_gpio_set_direction() pinctrl: armada-37xx: propagate error from armada_37xx_gpio_get_direction() pinctrl: armada-37xx: propagate error from armada_37xx_pmx_set_by_name() ipv4/route: Use this_cpu_inc() for stats on PREEMPT_RT tcp: always seek for minimal rtt in tcp_rcv_rtt_update() net: dlink: add synchronization for stats update sctp: Do not wake readers in __sctp_write_space() emulex/benet: correct command version selection in be_cmd_get_stats() i2c: designware: Invoke runtime suspend on quick slave re-registration net: macb: Check return value of dma_set_mask_and_coherent() cpufreq: Force sync policy boost with global boost on sysfs update nios2: force update_mmu_cache on spurious tlb-permission--related pagefaults media: platform: exynos4-is: 
Add hardware sync wait to fimc_is_hw_change_mode() media: tc358743: ignore video while HPD is low drm/amdkfd: Set SDMA_RLCx_IB_CNTL/SWITCH_INSIDE_IB jfs: Fix null-ptr-deref in jfs_ioc_trim drm/amdgpu/gfx9: fix CSIB handling drm/amdgpu/gfx8: fix CSIB handling jfs: fix array-index-out-of-bounds read in add_missing_indices drm/amdgpu/gfx7: fix CSIB handling drm/amd/display: Add NULL pointer checks in dm_force_atomic_commit() media: uapi: v4l: Fix V4L2_TYPE_IS_OUTPUT condition sunrpc: update nextcheck time when adding new cache entries drm/amdgpu/gfx6: fix CSIB handling ACPI: battery: negate current when discharging power: supply: bq27xxx: Retrieve again when busy ACPICA: fix acpi parse and parseext cache leaks ACPICA: Avoid sequence overread in call to strncmp() ACPICA: fix acpi operand cache leak in dswstate.c PCI: Fix lock symmetry in pci_slot_unlock() regulator: max14577: Add error check for max14577_read_reg() staging: iio: ad5933: Correct settling cycles encoding per datasheet net: ch9200: fix uninitialised access during mii_nway_restart ftrace: Fix UAF when lookup kallsym after ftrace disabled dm-mirror: fix a tiny race condition mm: fix ratelimit_pages update error in dirty_ratio_handler() ipc: fix to protect IPCS lookups using RCU parisc: fix building with gcc-15 vgacon: Add check for vc_origin address range in vgacon_scroll() NFC: nci: uart: Set tty->disc_data only in success path f2fs: prevent kernel warning due to negative i_nlink from corrupted image Input: ims-pcu - check record size in ims_pcu_flash_firmware() ext4: fix calculation of credits for extent tree modification ext4: inline: fix len overflow in ext4_prepare_inline_data ata: pata_via: Force PIO for ATAPI devices on VT6415/VT6330 media: v4l2-dev: fix error handling in __video_register_device() media: gspca: Add error handling for stv06xx_read_sensor() wifi: rtlwifi: disable ASPM for RTL8723BE with subsystem ID 11ad:1723 nfsd: nfsd4_spo_must_allow() must check this is a v4 compound request wifi: 
p54: prevent buffer-overflow in p54_rx_eeprom_readback() gfs2: move msleep to sleepable context configfs: Do not override creating attribute file failure in populate_attrs() calipso: unlock rcu before returning -EAFNOSUPPORT usb: Flush altsetting 0 endpoints before reinitializating them after reset. fs/filesystems: Fix potential unsigned integer underflow in fs_name() net/mdiobus: Fix potential out-of-bounds read/write access MIPS: Move '-Wa,-msoft-float' check from as-option to cc-option x86/boot/compressed: prefer cc-option for CFLAGS additions net: mdio: C22 is now optional, EOPNOTSUPP if not provided i40e: retry VFLR handling if there is ongoing VF reset i40e: return false from i40e_reset_vf if reset is in progress net_sched: sch_sfq: fix a potential crash on gso_skb handling scsi: iscsi: Fix incorrect error path labels for flashnode operations NFSD: Fix NFSv3 SETATTR/CREATE's handling of large file sizes NFSD: Fix ia_size underflow Input: synaptics-rmi - fix crash with unsupported versions of F34 Input: synaptics-rmi4 - convert to use sysfs_emit() APIs do_change_type(): refuse to operate on unmounted/not ours mounts net/mlx4_en: Prevent potential integer overflow calculating Hz rtc: Fix offset calculation for .start_secs < 0 rtc: sh: assign correct interrupts with DT perf tests switch-tracking: Fix timestamp comparison mfd: stmpe-spi: Correct the name used in MODULE_DEVICE_TABLE mfd: exynos-lpass: Avoid calling exynos_lpass_disable() twice in exynos_lpass_remove() rpmsg: qcom_smd: Fix uninitialized return variable in __qcom_smd_send() perf ui browser hists: Set actions->thread before calling do_zoom_thread() fbdev: core: fbcvt: avoid division by 0 in fb_cvt_hperiod() soc: aspeed: Add NULL check in aspeed_lpc_enable_snoop() soc: aspeed: lpc: Fix impossible judgment condition arm64: dts: rockchip: disable unrouted USB controllers and PHY on RK3399 Puma with Haikou ARM: dts: qcom: apq8064 merge hw splinlock into corresponding syscon device bus: fsl-mc: fix 
double-free on mc_dev nilfs2: do not propagate ENOENT error from nilfs_btree_propagate() nilfs2: add pointer check for nilfs_direct_propagate() Squashfs: check return result of sb_min_blocksize ARM: dts: at91: at91sam9263: fix NAND chip selects ARM: dts: at91: usb_a9263: fix GPIO for Dataflash chip select f2fs: fix to correct check conditions in f2fs_cross_rename f2fs: use d_inode(dentry) cleanup dentry->d_inode calipso: Don't call calipso functions for AF_INET sk. net: lan743x: rename lan743x_reset_phy to lan743x_hw_reset_phy wifi: ath9k_htc: Abort software beacon handling if disabled bpf: Fix WARN() in get_bpf_raw_tp_regs pinctrl: at91: Fix possible out-of-boundary access net: ncsi: Fix GCPS 64-bit member variables f2fs: fix to do sanity check on sbi->total_valid_block_count drm/tegra: rgb: Fix the unbound reference count drm: rcar-du: Fix memory leak in rcar_du_vsps_init() selftests/seccomp: fix syscall_restart test for arm compat firmware: psci: Fix refcount leak in psci_dt_init m68k: mac: Fix macintosh_config for Mac II drm/vmwgfx: Add seqno waiter for sync_files ACPI: OSI: Stop advertising support for "3.0 _SCP Extensions" x86/mtrr: Check if fixed-range MTRRs exist in mtrr_save_fixed_ranges() crypto: marvell/cesa - Avoid empty transfer descriptor crypto: marvell/cesa - Handle zero-length skcipher requests x86/cpu: Sanitize CPUID(0x80000000) output perf/core: Fix broken throttling when max_samples_per_tick=1 gfs2: gfs2_create_inode error handling fix netfilter: nft_socket: fix sk refcount leaks thunderbolt: Do not double dequeue a configuration request usb: usbtmc: Fix timeout value in get_stb usb: storage: Ignore UAS driver for SanDisk 3.2 Gen2 storage device usb: quirks: Add NO_LPM quirk for SanDisk Extreme 55AE pinctrl: armada-37xx: set GPIO output value before setting direction pinctrl: armada-37xx: use correct OUTPUT_VAL register for GPIOs > 31 tracing: Fix compilation warning on arm32 platform/x86: thinkpad_acpi: Ignore battery threshold change event 
notification platform/x86: fujitsu-laptop: Support Lifebook S2110 hotkeys spi: spi-sun4i: fix early activation um: let 'make clean' properly clean underlying SUBARCH as well platform/x86: thinkpad_acpi: Support also NEC Lavie X1475JAS nfs: don't share pNFS DS connections between net namespaces HID: quirks: Add ADATA XPG alpha wireless mouse support coredump: fix error handling for replace_fd() smb: client: Reset all search buffer pointers when releasing buffer smb: client: Fix use-after-free in cifs_fill_dirent drm/i915/gvt: fix unterminated-string-initialization warning netfilter: nf_tables: do not defer rule destruction via call_rcu netfilter: nf_tables: wait for rcu grace period on net_device removal netfilter: nf_tables: pass nft_chain to destroy function, not nft_ctx mm/page_alloc.c: avoid infinite retries caused by cpuset race llc: fix data loss when reading from a socket in llc_ui_recvmsg() ALSA: pcm: Fix race of buffer access at PCM OSS layer can: bcm: add missing rcu read protection for procfs content can: bcm: add locking for bcm_op runtime updates crypto: algif_hash - fix double free in hash_accept net: dwmac-sun8i: Use parsed internal PHY address instead of 1 __legitimize_mnt(): check for MNT_SYNC_UMOUNT should be under mount_lock xenbus: Allow PVH dom0 a non-local xenstore btrfs: correct the order of prelim_ref arguments in btrfs__prelim_ref ASoC: Intel: bytcr_rt5640: Add DMI quirk for Acer Aspire SW3-013 pinctrl: meson: define the pull up/down resistor value as 60 kOhm drm: Add valid clones check regulator: ad5398: Add device tree support bpftool: Fix readlink usage in get_fd_type HID: usbkbd: Fix the bit shift number for LED_KANA scsi: st: Restore some drive settings after reset scsi: lpfc: Handle duplicate D_IDs in ndlp search-by D_ID routine hwmon: (xgene-hwmon) use appropriate type for the latency value ip: fib_rules: Fetch net from fib_rule in fib[46]_rule_configure(). 
net/mlx5: Extend Ethtool loopback selftest to support non-linear SKB net/mlx4_core: Avoid impossible mlx4_db_alloc() order value smack: recognize ipv4 CIPSO w/o categories pinctrl: devicetree: do not goto err when probing hogs in pinctrl_dt_to_map ASoC: ops: Enforce platform maximum on initial value ACPI: HED: Always initialize before evged PCI: Fix old_size lower bound in calculate_iosize() too EDAC/ie31200: work around false positive build warning net: pktgen: fix access outside of user given buffer in pktgen_thread_write() MIPS: pm-cps: Use per-CPU variables as per-CPU, not per-core MIPS: Use arch specific syscall name match function cpuidle: menu: Avoid discarding useful information x86/nmi: Add an emergency handler in nmi_desc & use it in nmi_shootdown_cpus() bonding: report duplicate MAC address in all situations net: xgene-v2: remove incorrect ACPI_PTR annotation x86/bugs: Make spectre user default depend on MITIGATION_SPECTRE_V2 net: pktgen: fix mpls maximum labels list parsing pinctrl: bcm281xx: Use "unsigned int" instead of bare "unsigned" media: cx231xx: set device_caps for 417 dm cache: prevent BUG_ON by blocking retries on failed device resumes media: c8sectpfe: Call of_node_put(i2c_bus) only once in c8sectpfe_probe() ARM: tegra: Switch DSI-B clock parent to PLLD on Tegra114 ieee802154: ca8210: Use proper setters and getters for bitwise types rtc: ds1307: stop disabling alarms on probe powerpc/prom_init: Fixup missing #size-cells on PowerBook6,7 mmc: sdhci: Disable SD card clock before changing parameters posix-timers: Add cond_resched() to posix_timer_add() search loop xen: Add support for XenServer 6.1 platform device dm: restrict dm device size to 2^63-512 bytes kbuild: fix argument parsing in scripts/config scsi: st: ERASE does not change tape location scsi: st: Tighten the page format heuristics with MODE SELECT ext4: reorder capability check last um: Update min_low_pfn to match changes in uml_reserved um: Store full CSGSFS and SS register from 
mcontext btrfs: send: return -ENAMETOOLONG when attempting a path that is too long btrfs: avoid linker error in btrfs_find_create_tree_block() i2c: pxa: fix call balance of i2c->clk handling routines mmc: host: Wait for Vdd to settle on card power off pNFS/flexfiles: Report ENETDOWN as a connection error tools/build: Don't pass test log files to linker dql: Fix dql->limit value when reset. SUNRPC: rpc_clnt_set_transport() must not change the autobind setting NFSv4: Treat ENETUNREACH errors as fatal for state recovery fbdev: core: tileblit: Implement missing margin clearing for tileblit fbdev: fsl-diu-fb: add missing device_remove_file() mailbox: use error ret code of of_parse_phandle_with_args() kconfig: merge_config: use an empty file as initfile cgroup: Fix compilation issue due to cgroup_mutex not being exported dma-mapping: avoid potential unused data compilation warning scsi: target: iscsi: Fix timeout on deleted connection openvswitch: Fix unsafe attribute parsing in output_userspace() Input: synaptics - enable InterTouch on TUXEDO InfinityBook Pro 14 v5 Input: synaptics - enable SMBus for HP Elitebook 850 G1 phy: Fix error handling in tegra_xusb_port_init ALSA: es1968: Add error handling for snd_pcm_hw_constraint_pow2() ACPI: PPTT: Fix processor subtable walk qlcnic: fix memory leak in qlcnic_sriov_channel_cfg_cmd() ALSA: sh: SND_AICA should depend on SH_DMA_API spi: loopback-test: Do not split 1024-byte hexdumps RDMA/rxe: Fix slab-use-after-free Read in rxe_queue_cleanup bug staging: axis-fifo: Correct handling of tx_fifo_depth for size validation staging: axis-fifo: avoid parsing ignored device tree properties platform/x86: asus-wmi: Fix wlan_ctrl_by_user detection do_umount(): add missing barrier before refcount checks in sync case MIPS: Fix MAX_REG_OFFSET iio: adc: dln2: Use aligned_s64 for timestamp types: Complement the aligned types with signed 64-bit one USB: usbtmc: use interruptible sleep in usbtmc_read usb: typec: tcpm: delay SNK_TRY_WAIT_DEBOUNCE 
to SRC_TRYWAIT transition ocfs2: stop quota recovery before disabling quotas ocfs2: implement handshaking with ocfs2 recovery thread ocfs2: switch osb->disable_recovery to enum module: ensure that kobject_put() is safe for module type kobjects xenbus: Use kref to track req lifetime usb: uhci-platform: Make the clock really optional iio: imu: st_lsm6dsx: fix possible lockup in st_lsm6dsx_read_fifo iio: adis16201: Correct inclinometer channel resolution Input: synaptics - enable InterTouch on Dell Precision M3800 Input: synaptics - enable InterTouch on Dynabook Portege X30L-G Input: synaptics - enable InterTouch on Dynabook Portege X30-D net: dsa: b53: fix learning on VLAN unaware bridges scsi: target: Fix WRITE_SAME No Data Buffer crash dm: fix copying after src array boundaries iommu/amd: Fix potential buffer overflow in parse_ivrs_acpihid irqchip/gic-v2m: Add const to of_device_id sch_htb: make htb_qlen_notify() idempotent of: module: add buffer overflow check in of_modalias() net: fec: ERR007885 Workaround for conventional TX lan743x: remove redundant initialization of variable current_head_index net: dlink: Correct endianness handling of led_mode tracing: Fix oob write in trace_seq_to_buffer() dm: always update the array size in realloc_argv on success wifi: brcm80211: fmac: Add error handling for brcmf_usb_dl_writeimage() amd-xgbe: Fix to ensure dependent features are toggled with RX checksum offload i2c: imx-lpi2c: Fix clock count when probe defers EDAC/altera: Set DDR and SDMMC interrupt mask before registration EDAC/altera: Test the correct error reg offset signal/m68k: Use force_sigsegv(SIGSEGV) in fpsp040_die mmc: sdhci: Do not lock spinlock around mmc_gpio_get_ro() x86/bugs: fix backport error in "x86/bugs: Don't fill RSB on VMEXIT with eIBRS+retpoline" x86/bugs: fix backport error in "x86/bugs: Don't fill RSB on VMEXIT with eIBRS+retpoline" CIP: Bump version suffix to -cip121 after merge from cip/linux-4.19.y-st tree Update localversion-st, tree is 
up-to-date with 5.4.293. x86/bugs: Don't fill RSB on VMEXIT with eIBRS+retpoline clk: check for disabled clock-provider in of_clk_get_hw_from_clkspec() PCI: Rename PCI_IRQ_LEGACY to PCI_IRQ_INTX MIPS: cm: Fix warning if MIPS_CM is disabled comedi: jr3_pci: Fix synchronous deletion of timer scsi: pm80xx: Set phy_attached to zero when device is gone ACPI PPTT: Fix coding mistakes in a couple of sizeof() calls selftests: ublk: fix test_stripe_04 KVM: s390: Don't use %pK through tracepoints sched/isolation: Make CONFIG_CPU_ISOLATION depend on CONFIG_SMP ntb: reduce stack usage in idt_scan_mws qibfs: fix _another_ leak usb: gadget: aspeed: Add NULL pointer check in ast_vhub_init_dev() usb: host: max3421-hcd: Add missing spi_device_id table parisc: PDT: Fix missing prototype warning MIPS: cm: Detect CM quirks from device tree USB: VLI disk crashes if LPM is used usb: quirks: Add delay init quirk for SanDisk 3.2Gen1 Flash Drive usb: quirks: add DELAY_INIT quirk for Silicon Motion Flash Drive usb: dwc3: gadget: check that event count does not exceed event buffer length USB: OHCI: Add quirk for LS7A OHCI controller (rev 0x02) USB: serial: simple: add OWON HDS200 series oscilloscope support USB: serial: option: add Sierra Wireless EM9291 USB: serial: ftdi_sio: add support for Abacus Electrics Optical Probe USB: storage: quirk for ADATA Portable HDD CH94 mcb: fix a double free bug in chameleon_parse_gdd() virtio_console: fix missing byte order handling for cols and rows net_sched: hfsc: Fix a potential UAF in hfsc_dequeue() too net_sched: hfsc: Fix a UAF vulnerability in class handling tipc: fix NULL pointer dereference in tipc_mon_reinit_self() net: phy: leds: fix memory leak cpufreq: scpi: Fix null-ptr-deref in scpi_cpufreq_get_rate() misc: pci_endpoint_test: Fix displaying 'irq_type' after 'request_irq' error misc: pci_endpoint_test: Use INTX instead of LEGACY net: dsa: mv88e6xxx: fix VTU methods for 6320 family ext4: fix OOB read when checking dotdot dir ext4: optimize 
__ext4_check_dir_entry() MIPS: ds1287: Match ds1287_set_base_clock() function types MIPS: cevt-ds1287: Add missing ds1287.h include MIPS: dec: Declare which_prom() as static virtio-net: Add validation for used length openvswitch: fix lockup on tx to unregistering netdev with carrier net: openvswitch: fix race on port output mmc: cqhci: Fix checking of CQHCI_HALT state nvmet-fc: Remove unused functions usb: dwc3: support continuous runtime PM with dual role misc: pci_endpoint_test: Fix 'irq_type' to convey the correct type misc: pci_endpoint_test: Avoid issue of interrupts remaining after request_irq error tcp/dccp: Don't use timer_pending() in reqsk_queue_unlink(). kbuild: Add '-fno-builtin-wcslen' drm/sti: remove duplicate object names drm/repaper: fix integer overflows in repeat functions module: sign with sha512 instead of sha1 by default isofs: Prevent the use of too small fid i2c: cros-ec-tunnel: defer probe if parent EC is not present hfs/hfsplus: fix slab-out-of-bounds in hfs_bnode_read_key btrfs: correctly escape subvol in btrfs_show_options() nfs: move nfs_fhandle_hash to common include file NFSD: Constify @fh argument of knfsd_fh_hash() asus-laptop: Fix an uninitialized variable writeback: fix false warning in inode_to_wb() net: b53: enable BPDU reception for management port net: openvswitch: fix nested key length validation in the set() action Revert "wifi: mac80211: Update skb's control block key in ieee80211_tx_dequeue()" Bluetooth: btrtl: Prevent potential NULL dereference Bluetooth: hci_event: Fix sending MGMT_EV_DEVICE_FOUND for invalid address RDMA/usnic: Fix passing zero to PTR_ERR in usnic_ib_pci_probe() scsi: iscsi: Fix missing scsi_host_put() in error path wifi: wl1251: fix memory leak in wl1251_tx_work wifi: mac80211: Purge vif txq in ieee80211_do_stop() wifi: mac80211: Update skb's control block key in ieee80211_tx_dequeue() wifi: at76c50x: fix use after free access in at76_disconnect HSI: ssi_protocol: Fix use after free vulnerability in 
ssi_protocol Driver Due to Race Condition Bluetooth: hci_uart: Fix another race during initialization x86/e820: Fix handling of subpage regions when calculating nosave ranges in e820__register_nosave_regions() PCI: Fix reference leak in pci_alloc_child_bus() of/irq: Fix device node refcount leakages in of_irq_init() of/irq: Fix device node refcount leakage in API irq_of_parse_and_map() gpio: zynq: Fix wakeup source leaks on device unbind ftrace: Add cond_resched() to ftrace_graph_set_hash() crypto: ccp - Fix check for the primary ASP device thermal/drivers/rockchip: Add missing rk3328 mapping entry sctp: detect and prevent references to a freed transport in sendmsg mm: add missing release barrier on PGDAT_RECLAIM_LOCKED unlock sparc/mm: disable preemption in lazy mmu mode arm64: dts: mediatek: mt8173: Fix disp-pwm compatible string mtd: inftlcore: Add error check for inftl_read_oob() lib: scatterlist: fix sg_split_phys to preserve original scatterlist offsets jbd2: remove wrong sb->s_sequence check ext4: fix off-by-one error in do_split media: venus: hfi_parser: add check to avoid out of bound access media: i2c: ov7251: Introduce 1 ms delay between regulators and en GPIO media: i2c: ov7251: Set enable GPIO low in probe media: v4l2-dv-timings: prevent possible overflow in v4l2_detect_gtf() media: streamzap: prevent processing IR data on URB failure mtd: rawnand: brcmnand: fix PM resume warning arm64: cputype: Add MIDR_CORTEX_A76AE xenfs/xensyms: respect hypervisor's "next" indication media: siano: Fix error handling in smsdvb_module_init() media: venus: hfi: add check to handle incorrect queue size media: venus: hfi: add a check to handle OOB in sfr region media: i2c: adv748x: Fix test pattern selection mask bpf: support SKF_NET_OFF and SKF_LL_OFF on skb frags bpf: Add endian modifiers to fix endian warnings fbdev: omapfb: Add 'plane' value check drm/mediatek: mtk_dpi: Explicitly manage TVD clock in power on/off drm/amdkfd: Fix pqm_destroy_queue race with GPU reset 
drm: allow encoder mode_set even when connectors change for crtc Bluetooth: hci_uart: fix race during initialization tracing: fix return value in __ftrace_event_enable_disable for TRACE_REG_UNREGISTER net: vlan: don't propagate flags on open scsi: st: Fix array overflow in st_setup() ext4: ignore xattrs past end ext4: protect ext4_release_dquot against freezing ahci: add PCI ID for Marvell 88SE9215 SATA Controller ata: libata-eh: Do not use ATAPI DMA for a device limited to PIO mode jfs: add sanity check for agwidth in dbMount jfs: Prevent copying of nlink with value 0 from disk inode fs/jfs: Prevent integer overflow in AG size calculation fs/jfs: cast inactags to s64 to prevent potential overflow ALSA: usb-audio: Fix CME quirk for UF series keyboards ALSA: hda: intel: Fix Optimus when GPU has no sound HID: pidff: Fix null pointer dereference in pidff_find_fields HID: pidff: Do not send effect envelope if it's empty HID: pidff: Convert infinite length from Linux API to PID standard perf: arm_pmu: Don't disable counter in armpmu_add() x86/cpu: Don't clear X86_FEATURE_LAHF_LM flag in init_amd_k8() on AMD when running in a virtual machine pm: cpupower: bench: Prevent NULL dereference on malloc failure net: ppp: Add bound checking for skb data on ppp_sync_txmung ata: sata_sx4: Add error handling in pdc20621_i2c_read() ata: sata_sx4: Drop pointless VPRINTK() calls and convert the remaining ones tipc: fix memory leak in tipc_link_xmit ata: pata_pxa: Fix potential NULL pointer dereference in pxa_ata_probe() CIP: Bump version suffix to -cip120 after merge from cip/linux-4.19.y-st tree Update localversion-st, tree is up-to-date with 5.4.292. 
net: dsa: mv88e6xxx: propperly shutdown PPU re-enable timer on destroy jfs: add index corruption check to DT_GETPAGE() jfs: fix slab-out-of-bounds read in ea_get() tracing: Fix use-after-free in print_graph_function_flags during tracer switching mmc: sdhci-pxav3: set NEED_RSP_BUSY capability x86/tsc: Always save/restore TSC sched_clock() on suspend/resume ntb_perf: Delete duplicate dmaengine_unmap_put() call in perf_copy_chunk() arcnet: Add NULL check in com20020pci_probe() ipv6: fix omitted netlink attributes when using RTEXT_FILTER_SKIP_STATS vsock: avoid timeout during connect() if the socket is closing net_sched: skbprio: Remove overly strict queue assertions netlabel: Fix NULL pointer exception caused by CALIPSO on IPv4 sockets ntb: intel: Fix using link status DB's ntb_hw_switchtec: Fix shift-out-of-bounds in switchtec_ntb_mw_set_trans spufs: fix a leak in spufs_create_context() spufs: fix a leak on spufs_new_file() failure hwmon: (nct6775-core) Fix out of bounds access for NCT679{8,9} sched/deadline: Use online cpus for validating runtime affs: don't write overlarge OFS data block size fields affs: generate OFS sequence numbers starting at 1 wifi: iwlwifi: fw: allocate chained SG tables for dump sched/smt: Always inline sched_smt_active() ring-buffer: Fix bytes_dropped calculation issue objtool, media: dib8000: Prevent divide-by-zero in dib8000_set_dds() fs/procfs: fix the comment above proc_pid_wchan() perf python: Check if there is space to copy all the event perf python: Decrement the refcount of just created event on failure perf python: Fixup description of sample.id event member ocfs2: validate l_tree_depth to avoid out-of-bounds access perf units: Fix insufficient array space iio: accel: mma8452: Ensure error return on failure to matching oversampling ratio coresight: catu: Fix number of pages while using 64k pages isofs: fix KMSAN uninit-value bug in do_isofs_readdir() x86/dumpstack: Fix inaccurate unwinding from exception stacks due to misplaced 
assignment mfd: sm501: Switch to BIT() to mitigate integer overflows RDMA/mlx5: Fix mlx5_poll_one() cur_qp update flow power: supply: max77693: Fix wrong conversion of charge input threshold value x86/entry: Fix ORC unwinder for PUSH_REGS with save_ret=1 IB/mad: Check available slots before posting receive WRs clk: rockchip: rk3328: fix wrong clk_ref_usb3otg parent lib: 842: Improve error handling in sw842_compress() clk: amlogic: gxbb: drop incorrect flag on 32k clock fbdev: sm501fb: Add some geometry checks. mdacon: rework dependency list fbdev: au1100fb: Move a variable assignment behind a null pointer check PCI/portdrv: Only disable pciehp interrupts early when needed ALSA: hda/realtek: Always honor no_shutup_pins perf/ring_buffer: Allow the EPOLLRDNORM flag for poll lockdep: Don't disable interrupts on RT in disable_irq_nosync_lockdep.*() thermal: int340x: Add NULL check for adev EDAC/ie31200: Fix the error path order of ie31200_init() EDAC/ie31200: Fix the DIMM size mask for several SoCs x86/fpu: Avoid copying dynamic FP state from init_task in arch_dup_task_struct() cpufreq: governor: Fix negative 'idle_time' handling in dbs_update() net: usb: usbnet: restore usb%d name exception for local mac addresses net: usb: qmi_wwan: add Telit Cinterion FE990B composition net: usb: qmi_wwan: add Telit Cinterion FN990B composition tty: serial: 8250: Add some more device IDs netfilter: socket: Lookup orig tuple for IPv6 SNAT ARM: 9351/1: fault: Add "cut here" line for prefetch aborts ARM: 9350/1: fault: Implement copy_from_kernel_nofault_allowed() atm: Fix NULL pointer dereference ALSA: usb-audio: Add quirk for Plantronics headsets to fix control names drm/radeon: fix uninitialized size issue in radeon_vce_cs_parse() batman-adv: Ignore own maximum aggregation size during RX ARM: shmobile: smp: Enforce shmobile_smp_* alignment mmc: atmel-mci: Add missing clk_disable_unprepare() net/neighbor: add missing policy for NDTPA_QUEUE_LENBYTES net: atm: fix use after free in 
lec_send() Bluetooth: Fix error code in chan_alloc_skb_cb() RDMA/hns: Fix wrong value of max_sge_rd RDMA/bnxt_re: Avoid clearing VLAN_ID mask in modify qp path xfrm_output: Force software GSO only in tunnel mode i2c: sis630: Fix an error handling path in sis630_probe() i2c: ali15x3: Fix an error handling path in ali15x3_probe() i2c: ali1535: Fix an error handling path in ali1535_probe() ASoC: codecs: wm0010: Fix error handling path in wm0010_spi_probe() drm/gma500: Add NULL check for pci_gfx_root in mid_get_vbt_data() qlcnic: fix memory leak issues in qlcnic_sriov_common.c drm/amd/display: Assign normalized_pix_clk when color depth = 14 x86/microcode/AMD: Fix out-of-bounds on systems with CPU-less NUMA nodes USB: serial: option: match on interface class for Telit FN990B USB: serial: option: fix Telit Cinterion FE990A name USB: serial: option: add Telit Cinterion FE990B compositions USB: serial: ftdi_sio: add support for Altera USB Blaster 3 block: fix 'kmem_cache of name 'bio-108' already exists' drm/nouveau: Do not override forced connector status x86/irq: Define trace events conditionally nvme: only allow entering LIVE from CONNECTING state sctp: Fix undefined behavior in left shift operation nvmet-rdma: recheck queue state is LIVE in state lock in recv done s390/cio: Fix CHPID "configure" attribute caching HID: ignore non-functional sensor in HP 5MP Camera iscsi_ibft: Fix UBSAN shift-out-of-bounds warning in ibft_attr_show_nic() powercap: call put_device() on an error path in powercap_register_control_type() nvme-fc: go straight to connecting state when initializing net_sched: Prevent creation of classes with TC_H_ROOT ipvs: prevent integer overflow in do_ip_vs_get_ctl() netfilter: nf_conncount: Fully initialize struct nf_conncount_tuple in insert_tree() Drivers: hv: vmbus: Don't release fb_mmio resource in vmbus_free_mmio() drivers/hv: Replace binary semaphore with mutex netpoll: hold rcu read lock in __netpoll_send_skb() netpoll: netpoll_send_skb() returns 
transmit status netpoll: move netpoll_send_skb() out of line netpoll: remove dev argument from netpoll_send_skb_on_dev() netpoll: Fix use correct return type for ndo_start_xmit() pinctrl: bcm281xx: Fix incorrect regmap max_registers value sctp: sysctl: auth_enable: avoid using current->nsproxy sctp: sysctl: cookie_hmac_alg: avoid using current->nsproxy Revert "sctp: sysctl: auth_enable: avoid using current->nsproxy" Revert "sctp: sysctl: cookie_hmac_alg: avoid using current->nsproxy" sched/isolation: Prevent boot crash when the boot CPU is nohz_full CIP: Bump version suffix to -cip119 after merge from cip/linux-4.19.y-st tree watchdog: renesas_wdt: support handover from bootloader Update localversion-st, tree is up-to-date with 5.4.291. gtp: Suppress list corruption splat in gtp_net_exit_batch_rtnl(). gtp: Destroy device along with udp socket's netns dismantle. net: gso: fix ownership in __udp_gso_segment vlan: fix memory leak in vlan_newlink() batman-adv: Drop unmanaged ELP metric worker tee: optee: Fix supplicant wait loop pps: Fix a use-after-free net: rose: lock the socket in rose_bind() btrfs: fix use-after-free when attempting to join an aborted transaction media: lmedm04: Handle errors for lme2510_int_read wifi: rtlwifi: rtl8192se: rise completion of firmware loading as last step eeprom: digsy_mtc: Make GPIO lookup table match the device slimbus: messaging: Free transaction ID in delayed interrupt scenario intel_th: pci: Add Panther Lake-P/U support intel_th: pci: Add Panther Lake-H support intel_th: pci: Add Arrow Lake support Squashfs: check the inode number is not the invalid value of zero xhci: pci: Fix indentation in the PCI device ID definitions usb: gadget: Check bmAttributes only if configuration is valid usb: gadget: Fix setting self-powered state on suspend usb: gadget: Set self-powered based on MaxPower and bmAttributes usb: typec: tcpci_rt1711h: Unmask alert interrupts to fix functionality usb: typec: ucsi: increase timeout for PPM reset 
operations usb: atm: cxacru: fix a flaw in existing endpoint checks usb: quirks: Add DELAY_INIT and NO_LPM for Prolific Mass Storage Card Reader usb: renesas_usbhs: Use devm_usb_get_phy() Revert "drivers/card_reader/rtsx_usb: Restore interrupt based detection" net: ipv6: fix missing dst ref drop in ila lwtunnel net: ipv6: fix dst ref loop in ila lwtunnel net-timestamp: support TCP GSO case for a few missing flags vlan: enforce underlying device type ppp: Fix KMSAN uninit-value warning with bpf be2net: fix sleeping while atomic bugs in be_ndo_bridge_getlink hwmon: fix a NULL vs IS_ERR_OR_NULL() check in xgene_hwmon_probe() llc: do not use skb_get() before dev_queue_xmit() hwmon: (ad7314) Validate leading zero bits and return error hwmon: (ntc_thermistor) Fix the ncpXXxh103 sensor table hwmon: (pmbus) Initialise page count in pmbus_identify() caif_virtio: fix wrong pointer check in cfv_probe() HID: intel-ish-hid: Fix use-after-free issue in ishtp_hid_remove() mm/page_alloc: fix uninitialized variable rapidio: fix an API misues when rio_add_net() fails rapidio: add check for rio_add_net() in rio_scan_alloc_net() wifi: nl80211: reject cooked mode if it is set along with other flags wifi: cfg80211: regulatory: improve invalid hints checking x86/cpu: Properly parse CPUID leaf 0x2 TLB descriptor 0x63 x86/cpu: Validate CPUID leaf 0x2 EDX output x86/cacheinfo: Validate CPUID leaf 0x2 EDX output platform/x86: thinkpad_acpi: Add battery quirk for ThinkPad X131e drm/radeon: Fix rs400_gpu_init for ATI mobility radeon Xpress 200M ALSA: hda/realtek: update ALC222 depop optimize ALSA: hda: intel: Add Dell ALC3271 to power_save denylist HID: appleir: Fix potential NULL dereference at raw event handle Revert "of: reserved-memory: Fix using wrong number of cells to get property 'alignment'" drm/amdgpu: disable BAR resize on Dell G5 SE drm/amdgpu: Check extended configuration space register when system uses large bar drm/amdgpu: skip BAR resizing if the bios already did it acct: 
perform last write from workqueue kernel/acct.c: use dedicated helper to access rlimit values kernel/acct.c: use #elif instead of #end and #elif pfifo_tail_enqueue: Drop new packet when sch->limit == 0 sched/core: Prevent rescheduling when interrupts are disabled phy: exynos5-usbdrd: fix MPLL_MULTIPLIER and SSC_REFCLKSEL masks in refclk usbnet: gl620a: fix endpoint checking in genelink_bind() perf/core: Fix low freq setting via IOC_PERIOD ftrace: Avoid potential division by zero in function_stat_show() x86/CPU: Fix warm boot hang regression on AMD SC1100 SoC systems ipvs: Always clear ipvs_property flag in skb_scrub_packet() ASoC: es8328: fix route from DAC to output net: cadence: macb: Synchronize stats calculations sunrpc: suppress warnings for unused procfs functions batman-adv: Ignore neighbor throughput metrics in error case acct: block access to kernel internal filesystems ALSA: hda/conexant: Add quirk for HP ProBook 450 G4 mute LED nfp: bpf: Add check for nfp_app_ctrl_msg_alloc() power: supply: da9150-fg: fix potential overflow geneve: Suppress list corruption splat in geneve_destroy_tunnels(). geneve: Fix use-after-free in geneve_find_dev(). 
powerpc/code-patching: Fix KASAN hit by not flagging text patching area as VM_ALLOC ALSA: hda/realtek - Add type for ALC287 powerpc/64s: Rewrite __real_pte() and __rpte_to_hidx() as static inline powerpc/64s/mm: Move __real_pte stubs into hash-4k.h USB: gadget: f_midi: f_midi_complete to call queue_work usb/gadget: f_midi: Replace tasklet with work usb/gadget: f_midi: convert tasklets to use new tasklet_setup() API usb: dwc3: Fix timeout issue during controller enter/exit from halt state mm: update mark_victim tracepoints fields crypto: testmgr - some more fixes to RSA test vectors crypto: testmgr - populate RSA CRT parameters in RSA test vectors crypto: testmgr - fix version number of RSA tests crypto: testmgr - Fix wrong test case of RSA crypto: testmgr - fix wrong key length for pkcs1pad driver core: bus: Fix double free in driver API bus_register() scsi: storvsc: Set correct data length for sending SCSI command without payload vlan: move dev_put into vlan_dev_uninit vlan: introduce vlan_dev_free_egress_priority Revert "btrfs: avoid monopolizing a core when activating a swap file" parport_pc: add support for ASIX AX99100 can: ems_pci: move ASIX AX99100 ids to pci_ids.h nilfs2: protect access to buffers with no active references nilfs2: do not force clear folio if buffer is referenced nilfs2: do not output warnings when clearing dirty buffers alpha: replace hardcoded stack offsets with autogenerated ones ndisc: extend RCU protection in ndisc_send_skb() openvswitch: use RCU protection in ovs_vport_cmd_fill_info() arp: use RCU protection in arp_xmit() neighbour: use RCU protection in __neigh_notify() neighbour: delete redundant judgment statements ndisc: use RCU protection in ndisc_alloc_skb() ipv6: use RCU protection in ip6_default_advmss() ipv4: use RCU protection in inet_select_addr() ipv4: use RCU protection in rt_is_expired() net: add dev_net_rcu() helper net: treat possible_net_t net pointer as an RCU one and add read_pnet_rcu() partitions: mac: fix handling 
of bogus partition table gpio: stmpe: Check return value of stmpe_reg_read in stmpe_gpio_irq_sync_unlock alpha: align stack for page fault and user unaligned trap handlers alpha: make stack 16-byte aligned (most cases) can: c_can: fix unbalanced runtime PM disable in error path USB: serial: option: drop MeiG Smart defines USB: serial: option: fix Telit Cinterion FN990A name USB: serial: option: add Telit Cinterion FN990B compositions USB: serial: option: add MeiG Smart SLM828 usb: cdc-acm: Fix handling of oversized fragments usb: cdc-acm: Check control transfer buffer size before access USB: cdc-acm: Fill in Renesas R-Car D3 USB Download mode quirk USB: hub: Ignore non-compliant devices with too many configs or interfaces usb: gadget: f_midi: fix MIDI Streaming descriptor lengths USB: Add USB_QUIRK_NO_LPM quirk for sony xperia xz1 smartphone USB: quirks: add USB_QUIRK_NO_LPM quirk for Teclast dist USB: pci-quirks: Fix HCCPARAMS register error for LS7A EHCI usb: dwc2: gadget: remove of_node reference upon udc_stop usb: gadget: udc: renesas_usb3: Fix compiler warning usb: roles: set switch registered flag early on batman-adv: fix panic during interface removal ASoC: Intel: bytcr_rt5640: Add DMI quirk for Vexia Edu Atla 10 tablet 5V orangefs: fix a oob in orangefs_debug_write Grab mm lock before grabbing pt lock vfio/pci: Enable iowrite64 and ioread64 for vfio pci media: cxd2841er: fix 64-bit division on gcc-9 xen: remove a confusing comment on auto-translated guest I/O gpio: bcm-kona: Add missing newline to dev_err format string gpio: bcm-kona: Fix GPIO lock/unlock for banks above bank 0 arm64: cacheinfo: Avoid out-of-bounds write to cacheinfo array team: better TEAM_OPTION_TYPE_STRING validation vrf: use RCU protection in l3mdev_l3_out() ndisc: ndisc_send_redirect() must use dev_get_by_index_rcu() HID: multitouch: Add NULL check in mt_input_configured ocfs2: check dir i_size in ocfs2_find_entry MIPS: ftrace: Declare ftrace_get_parent_ra_addr() as static ptp: Ensure 
info->enable callback is always set mtd: onenand: Fix uninitialized retlen in do_otp_read() NFC: nci: Add bounds checking in nci_hci_create_pipe() nilfs2: fix possible int overflows in nilfs_fiemap() ocfs2: handle a symlink read error correctly ocfs2: fix incorrect CPU endianness conversion causing mount failure nvmem: core: improve range check for nvmem_cell_write() crypto: qce - fix goto jump in error path media: uvcvideo: Remove redundant NULL assignment media: uvcvideo: Fix event flags in uvc_ctrl_send_events media: ov5640: fix get_light_freq on auto soc: qcom: smem_state: fix missing of_node_put in error path powerpc/pseries/eeh: Fix get PE state translation serial: sh-sci: Do not probe the serial port if its slot in sci_ports[] is in use serial: sh-sci: Drop __initdata macro for port_cfg usb: gadget: f_tcm: Don't prepare BOT write request twice usb: gadget: f_tcm: ep_autoconfig with fullspeed endpoint usb: gadget: f_tcm: Decrement command ref count on cleanup usb: gadget: f_tcm: Translate error to sense wifi: brcmfmac: fix NULL pointer dereference in brcmf_txfinalize() HID: hid-sensor-hub: don't use stale platform-data on remove of: reserved-memory: Fix using wrong number of cells to get property 'alignment' of: Fix of_find_node_opts_by_path() handling of alias+path+options of: Correct child specifier used as input of the 2nd nexus node clk: qcom: clk-alpha-pll: fix alpha mode configuration Bluetooth: L2CAP: handle NULL sock pointer in l2cap_sock_alloc KVM: s390: vsie: fix some corner-cases when grabbing vsie pages KVM: Explicitly verify target vCPU is online in kvm_get_vcpu() arm64: dts: rockchip: increase gmac rx_delay on rk3399-puma binfmt_flat: Fix integer overflow bug on 32 bit systems m68k: vga: Fix I/O defines s390/futex: Fix FUTEX_OP_ANDN implementation leds: lp8860: Write full EEPROM, not only half of it cpufreq: s3c64xx: Fix compilation warning tun: revert fix group permission check netem: Update sch->q.qlen before qdisc_tree_reduce_backlog() udp: 
gso: do not drop small packets when PMTU reduces tg3: Disable tg3 PCIe AER on system reboot firmware: iscsi_ibft: fix ISCSI_IBFT Kconfig entry nvme: handle connectivity loss in nvme_set_queue_count usb: xhci: Fix NULL pointer dereference on certain command aborts usb: xhci: Add timeout argument in address_device USB HCD callback media: uvcvideo: Remove dangling pointers media: uvcvideo: Only save async fh if success nilfs2: handle errors that nilfs_prepare_chunk() may return nilfs2: eliminate staggered calls to kunmap in nilfs_rename nilfs2: move page release outside of nilfs_delete_entry and nilfs_set_link x86/mm: Don't disable PCID when INVLPG has been fixed by microcode HID: Wacom: Add PCI Wacom device support mfd: lpc_ich: Add another Gemini Lake ISA bridge PCI device-id wifi: brcmsmac: add gain range check to wlc_phy_iqcal_gainparams_nphy() mmc: core: Respect quirk_max_rate for non-UHS SDIO card tun: fix group permission check printk: Fix signed integer overflow when defining LOG_BUF_LEN_MAX sched: Don't try to catch up excess steal time. 
btrfs: convert BUG_ON in btrfs_reloc_cow_block() to proper error handling btrfs: output the reason for open_ctree() failure usb: gadget: f_tcm: Don't free command immediately media: uvcvideo: Fix double free in error path usb: typec: tcpm: set SRC_SEND_CAPABILITIES timeout to PD_T_SENDER_RESPONSE drivers/card_reader/rtsx_usb: Restore interrupt based detection ktest.pl: Check kernelrelease return in get_version NFSD: Reset cb_seq_status after NFS4ERR_DELAY hexagon: Fix unbalanced spinlock in die() hexagon: fix using plain integer as NULL pointer warning in cmpxchg genksyms: fix memory leak when the same symbol is read from *.symref file genksyms: fix memory leak when the same symbol is added from source net: sh_eth: Fix missing rtnl lock in suspend/resume path vsock: Allow retrying on connect() failure net: davicom: fix UAF in dm9000_drv_remove net: rose: fix timer races against user threads PM: hibernate: Add error handling for syscore_suspend() net: fec: implement TSO descriptor cleanup ubifs: skip dumping tnc tree when zroot is null dmaengine: ti: edma: fix OF node reference leaks in edma_driver module: Extend the preempt disabled section in dereference_symbol_descriptor(). 
ocfs2: mark dquot as inactive if failed to start trans while releasing dquot scsi: mpt3sas: Set ioc->manu_pg11.EEDPTagMode directly to 1 media: camif-core: Add check for clk_enable() media: mipi-csis: Add check for clk_enable() PCI: endpoint: Destroy the EPC device in devm_pci_epc_destroy() media: rc: iguanair: handle timeouts fbdev: omapfb: Fix an OF node leak in dss_of_port_get_parent_device() ARM: dts: mediatek: mt7623: fix IR nodename arm64: dts: mediatek: mt8173-evb: Fix MT6397 PMIC sub-node names arm64: dts: mediatek: mt8173-evb: Drop regulator-compatible property rdma/cxgb4: Prevent potential integer overflow on 32bit RDMA/mlx4: Avoid false error about access to uninitialized gids array perf report: Fix misleading help message about --demangle perf top: Don't complain about lack of vmlinux when not resolving some kernel samples padata: fix sysfs store callback check ktest.pl: Remove unused declarations in run_bisect_test function net: sched: Disallow replacing of child qdisc from one parent to another net/mlxfw: Drop hard coded max FW flash image size selftests: harness: fix printing of mismatch values in __EXPECT() selftests/harness: Display signed values correctly wifi: wlcore: fix unbalanced pm_runtime calls regulator: of: Implement the unwind path of of_regulator_match() team: prevent adding a device which is already a team device lower cpupower: fix TSC MHz calculation wifi: rtlwifi: pci: wait for firmware loading before releasing memory wifi: rtlwifi: fix memory leaks and invalid access at probe error path wifi: rtlwifi: remove unused dualmac control leftovers rtlwifi: replace usage of found with dedicated list iterator variable wifi: rtlwifi: usb: fix workqueue leak when probe fails wifi: rtlwifi: do not complete firmware loading needlessly drm/amdgpu: Fix potential NULL pointer dereference in atomctrl_get_smc_sclk_range_table drm/etnaviv: Fix page property being used for non writecombine buffers afs: Fix directory format encoding struct overflow: 
Allow mixed type arguments overflow: Correct check_shl_overflow() comment overflow: Add __must_check attribute to check_*() helpers udf: Fix use of check_add_overflow() with mixed type arguments CIP: Bump version suffix to -cip118 after merge from cip/linux-4.19.y-st tree Update localversion-st, tree is up-to-date with 5.4.290. gtp: Use for_each_netdev_rcu() in gtp_genl_dump_pdp(). arm64: dts: rockchip: add hevc power domain clock to rk3328 Partial revert of xhci: use pm_ptr() instead #ifdef for CONFIG_PM conditionals xhci: use pm_ptr() instead of #ifdef for CONFIG_PM conditionals Input: xpad - add support for wooting two he (arm) Input: xpad - add unofficial Xbox 360 wireless receiver clone Input: atkbd - map F23 key to support default copilot shortcut Revert "usb: gadget: u_serial: Disable ep before setting port to null to fix the crash caused by port being null" USB: serial: quatech2: fix null-ptr-deref in qt2_process_read_urb() vfio/platform: check the bounds of read/write syscalls net/xen-netback: prevent UAF in xenvif_flush_hash() m68k: Add missing mmap_read_lock() to sys_cacheflush() m68k: Update ->thread.esp0 before calling syscall_trace() in ret_from_signal gfs2: Truncate address space when flipping GFS2_DIF_JDATA flag irqchip/sunxi-nmi: Add missing SKIP_WAKE flag scsi: iscsi: Fix redundant response for ISCSI_UEVENT_GET_HOST_STATS request ASoC: wm8994: Add depends on MFD core net: fix data-races around sk->sk_forward_alloc scsi: sg: Fix slab-use-after-free read in sg_release() ipv6: avoid possible NULL deref in rt6_uncached_list_flush_dev() irqchip/gic-v3: Handle CPU_PM_ENTER_FAILED correctly fs/proc: fix softlockup in __read_vmcore (part 2) poll_wait: add mb() to fix theoretical race between waitqueue_active() and .poll() hfs: Sanity check the root record mac802154: check local interfaces before deleting sdata list i2c: mux: demux-pinctrl: check initial mux selection, too nfp: bpf: prevent integer overflow in nfp_bpf_event_output() gtp: use 
exit_batch_rtnl() method net: add exit_batch_rtnl() method net: net_namespace: Optimize the code net: ethernet: ti: cpsw_ale: Fix cpsw_ale_get_field() sctp: sysctl: rto_min/max: avoid using current->nsproxy ocfs2: fix slab-use-after-free due to dangling pointer dqi_priv ocfs2: correct return value of ocfs2_local_free_info() phy: core: Fix that API devm_of_phy_provider_unregister() fails to unregister the phy provider phy: core: fix code style in devm_of_phy_provider_unregister arm64: dts: rockchip: fix pd_tcpc0 and pd_tcpc1 node position on rk3399 arm64: dts: rockchip: fix defines in pd_vio node for rk3399 iio: inkern: call iio_device_put() only on mapped devices iio: adc: at91: call input_free_device() on allocated iio_dev iio: adc: ti-ads8688: fix information leak in triggered buffer iio: imu: kmx61: fix information leak in triggered buffer iio: dummy: iio_simply_dummy_buffer: fix information leak in triggered buffer iio: pressure: zpa2326: fix information leak in triggered buffer usb: gadget: f_fs: Remove WARN_ON in functionfs_bind usb: fix reference leak in usb_new_device() USB: usblp: return error when setting unsupported protocol usb: gadget: u_serial: Disable ep before setting port to null to fix the crash caused by port being null USB: serial: cp210x: add Phoenix Contact UPS Device usb-storage: Add max sectors quirk for Nokia 208 staging: iio: ad9832: Correct phase range check staging: iio: ad9834: Correct phase range check USB: serial: option: add Neoway N723-EA support USB: serial: option: add MeiG Smart SRM815 drm/amd/display: Add check for granularity in dml ceil/floor helpers sctp: sysctl: auth_enable: avoid using current->nsproxy sctp: sysctl: cookie_hmac_alg: avoid using current->nsproxy dm thin: make get_first_thin use rcu-safe list first function tcp/dccp: allow a connection when sk_max_ack_backlog is zero tcp/dccp: complete lockless accesses to sk->sk_max_ack_backlog net: 802: LLC+SNAP OID:PID lookup on start of skb data ieee802154: ca8210: Add 
missing check for kfifo_alloc() in ca8210_probe() dm array: fix cursor index when skipping across block boundaries dm array: fix unreleased btree blocks on closing a faulty array cursor dm array: fix releasing a faulty array block twice in dm_array_cursor_end jbd2: flush filesystem device before updating tail sequence ravb: Fix use-after-free issue in ravb_tx_timeout_work() net/sched: netem: fix backport of "account for backlog updates from child qdisc" CIP: Bump version suffix to -cip117 after merge from cip/linux-4.19.y-st tree Update localversion-st, tree is up-to-date with 5.4.289. RDMA/bnxt_re: Fix max_qp_wrs reported net/sched: netem: account for backlog updates from child qdisc net/sched: cbs: Fix integer overflow in cbs_set_port_rate() netfilter: nft_set_hash: skip duplicated elements pending gc run drm/etnaviv: flush shader L1 cache after user commandstream usb: yurex: make waiting on yurex_write interruptible perf trace: Avoid garbage when not printing a syscall's arguments scsi: qedf: Fix a possible memory leak in qedf_alloc_and_init_sb() mfd: intel_soc_pmic_bxtwc: Use IRQ domain for PMIC devices mfd: intel_soc_pmic_bxtwc: Use IRQ domain for TMU device mm: vmscan: account for free pages to prevent infinite Loop in throttle_direct_reclaim() drm: adv7511: Drop dsi single lane support net/sctp: Prevent autoclose integer overflow in sctp_association_init() sky2: Add device ID 11ab:4373 for Marvell 88E8075 pinctrl: mcp23s08: Fix sleeping in atomic context due to regmap locking modpost: fix the missed iteration for the max bit in do_input() modpost: fix input MODULE_DEVICE_TABLE() built for 64-bit on 32-bit host irqchip/gic: Correct declaration of *percpu_base pointer in union gic_base net: usb: qmi_wwan: add Telit FE910C04 compositions sound: usb: format: don't warn that raw DSD is unsupported wifi: mac80211: wake the queues in case of failure in resume ila: serialize calls to nf_register_net_hooks() af_packet: fix vlan_get_protocol_dgram() vs MSG_PEEK 
af_packet: fix vlan_get_tci() vs MSG_PEEK ALSA: usb-audio: US16x08: Initialize array before use net: llc: reset skb->transport_header netrom: check buffer length before accessing it drm/bridge: adv7511_audio: Update Audio InfoFrame properly drm: bridge: adv7511: Enable SPDIF DAI RDMA/bnxt_re: Fix reporting hw_ver in query_device RDMA/bnxt_re: Add check for path mtu in modify_qp Drivers: hv: util: Avoid accessing a ringbuffer not initialized yet selinux: ignore unknown extended permissions btrfs: avoid monopolizing a core when activating a swap file tracing: Constify string literal data member in struct trace_event_call MIPS: Probe toolchain support of -msym32 virtio-blk: don't keep queue frozen during system suspend platform/x86: asus-nb-wmi: Ignore unknown event 0xCF regmap: Use correct format specifier for logging range errors scsi: qla1280: Fix hw revision numbering for ISP1020/1040 tracing/kprobe: Make trace_kprobe's module callback called after jump_label update mtd: rawnand: fix double free in atmel_pmecc_create_user() dmaengine: at_xdmac: avoid null_prt_deref in at_xdmac_prep_dma_memset dmaengine: mv_xor: fix child node refcount handling in early exit phy: core: Fix that API devm_phy_destroy() fails to destroy the phy phy: core: Fix that API devm_phy_put() fails to release the phy phy: core: Fix an OF node refcount leakage in of_phy_provider_lookup() phy: core: Fix an OF node refcount leakage in _of_phy_get() mtd: diskonchip: Cast an operand to prevent potential overflow nfsd: restore callback functionality for NFSv4.0 bpf: Check negative offsets in __bpf_skb_min_len() media: dvb-frontends: dib3000mb: fix uninit-value in dib3000_write_reg of: Fix error path in of_parse_phandle_with_args_map() nilfs2: prevent use of deleted inode of/irq: Fix using uninitialized variable @addr_len in API of_irq_parse_one() NFS/pnfs: Fix a live lock between recalled layouts and layoutget zram: refuse to use zero sized block device as backing device sh: clk: Fix clk_enable() to 
return 0 on NULL clk USB: serial: option: add Telit FE910C04 rmnet compositions USB: serial: option: add MediaTek T7XX compositions USB: serial: option: add Netprisma LCUK54 modules for WWAN Ready USB: serial: option: add MeiG Smart SLM770A USB: serial: option: add TCL IK512 MBIM & ECM efivarfs: Fix error on non-existent file i2c: riic: Always round-up when calculating bus period chelsio/chtls: prevent potential integer overflow on 32bit mmc: sdhci-tegra: Remove SDHCI_QUIRK_BROKEN_ADMA_ZEROLEN_DESC quirk netfilter: ipset: Fix for recursive locking warning net: ethernet: bgmac-platform: fix an OF node reference leak net: hinic: Fix cleanup in create_rxqs/txqs() net/smc: check sndbuf_space again after NOSPACE flag is set in smc_poll i2c: pnx: Fix timeout in wait functions PCI: Add ACS quirk for Broadcom BCM5760X NIC ALSA: usb: Fix UBSAN warning in parse_audio_unit() PCI/AER: Disable AER service on suspend net: sched: fix ordering of qlen adjustment ALSA: usb-audio: Fix a DMA to stack memory bug xen/netfront: fix crash when removing device KVM: arm64: Ignore PMCNTENSET_EL0 while checking for overflow status qca_spi: Make driver probing reliable ACPI: resource: Fix memory resource type union access net: lapb: increase LAPB_HEADER_LEN batman-adv: Do not let TT changes list grows indefinitely batman-adv: Remove uninitialized data in full table TT response batman-adv: Do not send uninitialized TT changes usb: gadget: u_serial: Fix the issue that gs_start_io crashed due to accessing null pointer usb: ehci-hcd: fix call balance of clocks handling routines usb: dwc2: hcd: Fix GetPortStatus & SetPortFeature ata: sata_highbank: fix OF node reference leak in highbank_initialize_phys() usb: host: max3421-hcd: Correctly abort a USB request. 
bpf, xdp: Update devmap comments to reflect napi/rcu usage ALSA: usb-audio: Fix out of bounds reads when finding clock sources PCI: rockchip-ep: Fix address translation unit programming Revert "drm/amdgpu: add missing size check in amdgpu_debugfs_gprwave_read()" modpost: Add .irqentry.text to OTHER_SECTIONS ocfs2: Revert "ocfs2: fix the la space leak when unmounting an ocfs2 volume" jffs2: Fix rtime decompressor jffs2: Prevent rtime decompress memory corruption KVM: arm64: vgic-its: Clear ITE when DISCARD frees an ITE KVM: arm64: vgic-its: Clear DTE when MAPD unmaps a device KVM: arm64: vgic-its: Add a data length check in vgic_its_save_* misc: eeprom: eeprom_93cx6: Add quirk for extra read clock cycle powerpc/prom_init: Fixup missing powermac #size-cells usb: chipidea: udc: handle USB Error Interrupt if IOC not set PCI: Add 'reset_subordinate' to reset hierarchy below bridge nvdimm: rectify the illogical code within nd_dax_probe() scsi: st: Add MTIOCGET and MTLOAD to ioctls allowed after device reset scsi: st: Don't modify unknown block number in MTIOCGET leds: class: Protect brightness_show() with led_cdev->led_access mutex tracing: Use atomic64_inc_return() in trace_clock_counter() netpoll: Use rcu_access_pointer() in __netpoll_setup rocker: fix link status detection in rocker_carrier_init() ASoC: hdmi-codec: reorder channel allocation list wifi: brcmfmac: Fix oops due to NULL pointer dereference in brcmf_sdiod_sglist_rw() wifi: ipw2x00: libipw_rx_any(): fix bad alignment jfs: add a check to prevent array-index-out-of-bounds in dbAdjTree jfs: fix array-index-out-of-bounds in jfs_readdir jfs: fix shift-out-of-bounds in dbSplit jfs: array-index-out-of-bounds fix in dtReadFirst wifi: ath5k: add PCI ID for Arcadyan devices wifi: ath5k: add PCI ID for SX76X net: inet6: do not leave a dangling sk pointer in inet6_create() net: inet: do not leave a dangling sk pointer in inet_create() net: ieee802154: do not leave a dangling sk pointer in ieee802154_create() net: 
af_can: do not leave a dangling sk pointer in can_create() Bluetooth: L2CAP: do not leave dangling sk pointer on error in l2cap_sock_create() af_packet: avoid erroring out after sock_init_data() in packet_create() net: ethernet: fs_enet: Use %pa to format resource_size_t net: fec_mpc52xx_phy: Use %pa to format resource_size_t samples/bpf: Fix a resource leak drm/radeon/r600_cs: Fix possible int overflow in r600_packet3_check() media: cx231xx: Add support for Dexatek USB Video Grabber 1d19:6108 media: uvcvideo: Add a quirk for the Kaiweets KTI-W02 infrared camera s390/cpum_sf: Handle CPU hotplug remove during sampling regmap: detach regmap from dev on regmap_exit bcache: revert replacing IS_ERR_OR_NULL with IS_ERR again nilfs2: fix potential out-of-bounds memory access in nilfs_find_entry() scsi: qla2xxx: Remove check req_sg_cnt should be equal to rsp_sg_cnt scsi: qla2xxx: Supported speed displayed incorrectly for VPorts ocfs2: update seq_file index in ocfs2_dlm_seq_next tracing: Fix cmp_entries_dup() to respect sort() comparison rules HID: wacom: fix when get product name maybe null pointer bpf: Fix exact match conditions in trie_get_next_key() bpf: Handle BPF_EXIST and BPF_NOEXIST for LPM trie ocfs2: free inode when ocfs2_get_init_inode() fails spi: mpc52xx: Add cancel_work_sync before module remove drm/sti: Add __iomem for mixer_dbg_mxn's parameter gpio: grgpio: Add NULL check in grgpio_probe gpio: grgpio: use a helper variable to store the address of ofdev->dev crypto: x86/aegis128 - access 32-bit arguments as 32-bit x86/asm: Reorder early variables xen: Fix the issue of resource not being properly released in xenbus_dev_probe() xen/xenbus: fix locking xenbus/backend: Protect xenbus callback with lock xenbus/backend: Add memory pressure handler callback xen/xenbus: reference count registered modules netfilter: ipset: Hold module reference while requesting a module igb: Fix potential invalid memory access in igb_init_module() net/qed: allow old cards not 
supporting "num_images" to work dccp: Fix memory leak in dccp_feat_change_recv net/ipv6: release expired exception dst cached in socket netfilter: x_tables: fix LED ID check in led_tg_check() ipvs: fix UB due to uninitialized stack access in ip_vs_protocol_init() can: sun4i_can: sun4i_can_err(): fix {rx,tx}_errors statistics can: sun4i_can: sun4i_can_err(): call can_change_state() even if cf is NULL watchdog: mediatek: Make sure system reset gets asserted in mtk_wdt_restart() nfsd: fix nfs4_openowner leak when concurrent nfsd4_open occur dm thin: Add missing destroy_work_on_stack() util_macros.h: fix/rework find_closest() macros ftrace: Fix regression with module command in stack_trace_filter ovl: Filter invalid inodes with missing lookup function media: gspca: ov534-ov772x: Fix off-by-one error in set_frame_rate() media: venus: Fix pm_runtime_set_suspended() with runtime pm enabled media: ts2020: fix null-ptr-deref in ts2020_probe() media: i2c: tc358743: Fix crash in the probe error path when using polling btrfs: ref-verify: fix use-after-free after invalid ref action quota: flush quota_release_work upon quota writeback SUNRPC: correct error code comment in xs_tcp_setup_socket() um/sysrq: remove needless variable sp ALSA: hda/realtek: Set PCBeep to default value for ALC274 Revert "serial: sh-sci: Clean sci_ports[0] after at earlycon exit" serial: sh-sci: Clean sci_ports[0] after at earlycon exit ipmr: convert /proc handlers to rcu_read_lock() mfd: intel_soc_pmic_bxtwc: Use IRQ domain for USB Type-C device mfd: intel_soc_pmic_bxtwc: Use dev_err_probe() x86/xen/pvh: Annotate indirect branch as safe CIP: Bump version suffix to -cip116 after merge from stable Mark this as 4.19.324-cip115 release. CIP: Bump version suffix to -cip114 after merge from stable Mark this as 4.19.322-cip113 release. 
CIP: Bump version suffix to -cip112 after merge from stable CIP: Bump version suffix to -cip111 after merge from stable CIP: Bump version suffix to -cip110 after merge from stable CIP: Bump version suffix to -cip109 after merge from stable CIP: Bump version suffix to -cip108 after merge from stable memory: renesas-rpc-if: Clear HS bit during hardware initialization arm64: dts: renesas: rzg2: Add RPC-IF Support spi: spi-rpc-if: Check return value of rpcif_sw_init() memory: renesas-rpc-if: Remove redundant division of dummy memory: renesas-rpc-if: Simplify single/double data register access memory: renesas-rpc-if: Drop usage of RPCIF_DIRMAP_SIZE macro memory: renesas-rpc-if: Return error in case devm_ioremap_resource() fails memory: renesas-rpc-if: Fix HF/OSPI data transfer in Manual Mode memory: renesas-rpc-if: Correct QSPI data transfer in Manual mode memory: renesas-rpc-if: fix possible NULL pointer dereference of resource CIP: Bump version suffix to -cip107 after merge from stable ravb: remove undocumented counter processing ravb: remove undocumented endianness selection ravb: update "undocumented" annotations CIP: Bump version suffix to -cip106 after merge from stable Mark this as 4.19.299-cip105 release. 
CIP: Bump version suffix to -cip104 after merge from stable CIP: Bump version suffix to -cip103 after merge from stable CIP: Bump version suffix to -cip102 after merge from stable CIP: Bump version suffix to -cip101 after merge from stable CIP: Bump version suffix to -cip100 after merge from stable CIP: Bump version suffix to -cip99 after merge from stable CIP: Bump version suffix to -cip98 after merge from stable CIP: Bump version suffix to -cip97 after merge from stable CIP: Bump version suffix to -cip96 after merge from stable CIP: Bump version suffix to -cip95 after merge from stable CIP: Bump version suffix to -cip94 after merge from stable CIP: Bump version suffix to -cip93 after merge from stable CIP: Bump version suffix to -cip92 after merge from stable CIP: Bump version suffix to -cip91 after merge from stable CIP: Bump version suffix to -cip90 after merge from stable CIP: Bump version suffix to -cip89 after merge from stable CIP: Bump version suffix to -cip88 after merge from stable CIP: Bump version suffix to -cip87 after merge from stable CIP: Bump version suffix to -cip86 after merge from stable CIP: Bump version suffix to -cip85 after merge from stable CIP: Bump version suffix to -cip84 after merge from stable CIP: Bump version suffix to -cip83 after merge from stable CIP: Bump version suffix to -cip82 after merge from stable CIP: Bump version suffix to -cip81 after merge from stable drm: rcar-du: Fix Alpha blending issue on Gen3 CIP: Bump version suffix to -cip80 after merge from stable CIP: Bump version suffix to -cip79 after merge from stable CIP: Bump version suffix to -cip78 after merge from stable CIP: Bump version suffix to -cip77 after merge from stable CIP: Bump version suffix to -cip76 after merge from stable CIP: Bump version suffix to -cip75 after merge from stable CIP: Bump version suffix to -cip74 after merge from stable CIP: Bump version suffix to -cip73 after merge from stable CIP: Bump version suffix to -cip72 after merge from stable 
CIP: Bump version suffix to -cip71 after merge from stable CIP: Bump version suffix to -cip70 after merge from stable CIP: Bump version suffix to -cip69 after merge from stable CIP: Bump version suffix to -cip68 after merge from stable CIP: Bump version suffix to -cip67 after merge from stable CIP: Bump version suffix to -cip66 after merge from stable CIP: Bump version suffix to -cip65 after merge from stable CIP: Bump version suffix to -cip64 after merge from stable CIP: Bump version suffix to -cip63 after merge from stable CIP: Bump version suffix to -cip62 after merge from stable CIP: Bump version suffix to -cip61 after merge from stable CIP: Bump version suffix to -cip60 after merge from stable CIP: Bump version suffix to -cip59 after merge from stable CIP: Bump version suffix to -cip58 after merge from stable CIP: Bump version suffix to -cip57 after merge from stable CIP: Bump version suffix to -cip56 after merge from stable CIP: Bump version suffix to -cip55 after merge from stable CIP: Bump version suffix to -cip54 after merge from stable CIP: Bump version suffix to -cip53 after merge from stable CIP: Bump version suffix to -cip52 after merge from stable CIP: Bump version suffix to -cip51 after merge from stable CIP: Bump version suffix to -cip50 after merge from stable CIP: Bump version suffix to -cip49 after merge from stable media: i2c: imx219: Balance runtime PM use-count media: i2c: imx219: Move out locking/unlocking of vflip and hflip controls from imx219_set_stream CIP: Bump version suffix to -cip48 after merge from stable drm: rcar-du: Fix crash when using LVDS1 clock for CRTC CIP: Bump version suffix to -cip47 after merge from stable CIP: Bump version suffix to -cip46 after merge from stable arm64: dts: renesas: Add support for MIPI Adapter V2.1 connected to HiHope RZ/G2N arm64: dts: renesas: Add support for MIPI Adapter V2.1 connected to HiHope RZ/G2M arm64: dts: renesas: Add support for MIPI Adapter V2.1 connected to HiHope RZ/G2H arm64: dts: 
renesas: aistarvision-mipi-adapter-2.1: Add parent macro for each sensor arm64: dts: renesas: r8a774e1: Add VIN and CSI-2 nodes media: rcar-csi2: Enable support for R8A774E1 media: dt-bindings: media: renesas,csi2: Add R8A774E1 support media: rcar-vin: Enable support for R8A774E1 media: dt-bindings: media: renesas,vin: Add R8A774E1 support arm64: dts: renesas: r8a774b1: Add VIN and CSI-2 support media: rcar-csi2: Enable support for R8A774B1 media: dt-bindings: rcar-csi2: Add R8A774B1 support media: rcar-vin: Enable support for R8A774B1 media: dt-bindings: rcar-vin: Add R8A774B1 support arm64: dts: renesas: r8a774a1: Add VIN and CSI-2 nodes media: rcar-csi2: Enable support for r8a774a1 media: dt-bindings: media: rcar-csi2: Add r8a774a1 support media: rcar-vin: Enable support for r8a774a1 media: dt-bindings: media: rcar_vin: Add r8a774a1 support arm64: dts: renesas: r8a774c0-cat874: Add support for AISTARVISION MIPI Adapter V2.1 media: i2c: imx219: take lock in imx219_enum_mbus_code/frame_size media: i2c: imx219: Selection compliance fixes media: i2c: imx219: Fix a bug in imx219_enum_frame_size media: i2c: imx219: Implement get_selection media: i2c: imx219: Add support for cropped 640x480 resolution media: i2c: imx219: Add support for RAW8 bit bayer format media: i2c: imx219: Fix power sequence media: i2c: Add driver for Sony IMX219 sensor media: dt-bindings: media: i2c: Add IMX219 CMOS sensor binding media: rcar-csi2: Add support for MEDIA_BUS_FMT_SRGGB8_1X8 format media: rcar-vin: Add support for MEDIA_BUS_FMT_SRGGB8_1X8 format media: rcar-vin: Invalidate pipeline if conversion is not possible on input formats media: rcar-csi2: Update V3M and E3 start procedure media: rcar-vin: fix wrong return value in rvin_set_channel_routing() media: v4l: ctrl: Provide unlocked variant of v4l2_ctrl_grab media: v4l2-async: Log message in case of heterogeneous fwnode match media: v4l2-async: Pass notifier pointer to match functions media: v4l2-async: Accept endpoints and devices 
for fwnode matching media: device property: Add a function to test is a fwnode is a graph endpoint media: ov5645: Remove unneeded regulator_set_voltage() CIP: Bump version suffix to -cip45 after merge from stable CIP: Bump version suffix to -cip44 after merge from stable CIP: Bump version suffix to -cip43 after merge from stable CIP: Bump version suffix to -cip42 after merge from stable CIP: Bump version suffix to -cip41 after merge from stable spi: spi-mem: Make spi_mem_default_supports_op() static inline pinctrl: renesas: r8a77965: Add QSPI[01] pins, groups and functions pinctrl: renesas: r8a7796: Add QSPI[01] pins, groups and functions pinctrl: renesas: r8a77951: Add QSPI[01] pins, groups and functions pinctrl: renesas: r8a77990: Add QSPI[01] pins, groups and functions pinctrl: renesas: r8a77990: Optimize pinctrl image size for R8A774C0 pinctrl: renesas: r8a77965: Optimize pinctrl image size for R8A774B1 pinctrl: renesas: r8a77951: Optimize pinctrl image size for R8A774E1 pinctrl: renesas: r8a7796: Optimize pinctrl image size for R8A774A1 clk: renesas: r8a774c0: Add RPC clocks clk: renesas: r8a774b1: Add RPC clocks clk: renesas: r8a774a1: Add RPC clocks spi: rpc-if: Fix use-after-free on unbind spi: add Renesas RPC-IF driver spi: spi-mem: Fix a memory leak in spi_mem_dirmap_destroy() spi: spi-mem: Fix spi_mem_dirmap_destroy() kerneldoc spi: spi-mem: Add a new API to support direct mapping spi: spi-mem: Compute length only when needed spi: spi-mem: Fix passing zero to 'PTR_ERR' warning spi: spi-mem: fix reference leak in spi_mem_access_start spi: spi-mem: Split spi_mem_exec_op() code spi: spi-mem: export spi_mem_default_supports_op() spi: spi-mem: Add SPI_MEM_NO_DATA to the spi_mem_data_dir enum memory: renesas-rpc-if: Make rpcif_enable/disable_rpm() as static inline memory: renesas-rpc-if: Fix a node reference leak in rpcif_probe() memory: renesas-rpc-if: Fix unbalanced pm_runtime_enable in rpcif_{enable,disable}_rpm memory: renesas-rpc-if: Return correct value 
to the caller of rpcif_manual_xfer() memory: add Renesas RPC-IF driver dt-bindings: memory: document Renesas RPC-IF bindings dt-bindings: thermal: rcar-gen3-thermal: Add r8a774e1 support dt-bindings: PCI: rcar-pci-host: Document r8a774e1 bindings dt-bindings: PCI: rcar: Add device tree support for r8a774b1 dt-bindings: timer: renesas: tmu: Document r8a774e1 bindings dt-bindings: pci: rcar-pci-ep: Document missing interrupts property CIP: Bump version suffix to -cip40 after merge from stable arm64: dts: renesas: r8a774c0: Fix MSIOF1 DMA channels CIP: Bump version suffix to -cip39 after merge from stable arm64: dts: renesas: r8a774e1: Add audio support arm64: dts: renesas: r8a774e1: Add missing audio_clk_b CIP: Bump version suffix to -cip38 after merge from stable arm64: dts: renesas: r8a774e1: Add USB-DMAC and HSUSB device nodes arm64: dts: renesas: r8a774e1: Add USB3.0 device nodes arm64: dts: renesas: r8a774e1: Add USB2.0 phy and host (EHCI/OHCI) device nodes dt-bindings: dma: renesas,usb-dmac: Add binding for r8a774e1 dt-bindings: phy: renesas,usb3-phy: Add r8a774e1 support dt-bindings: phy: renesas,usb2-phy: Add r8a774e1 support dt-bindings: sound: renesas, rsnd: Document r8a774e1 bindings arm64: dts: renesas: Add HiHope RZ/G2H board with idk-1110wr display arm64: dts: renesas: r8a774e1: Add PWM device nodes dt-bindings: pwm: renesas,pwm-rcar: Add r8a774e1 support arm64: dts: renesas: r8a774e1-hihope-rzg2h: Setup DU clocks arm64: dts: renesas: r8a774e1: Add LVDS device node drm: rcar-du: lvds: Add support for R8A774E1 SoC dt-bindings: display: renesas,lvds: Document r8a774e1 bindings arm64: dts: renesas: r8a774e1: Populate HDMI encoder node dt-bindings: display: renesas,dw-hdmi: Add r8a774e1 support arm64: dts: renesas: r8a774e1: Populate DU device node drm: rcar-du: Add support for R8A774E1 SoC dt-bindings: display: renesas,du: Document r8a774e1 bindings arm64: dts: renesas: r8a774e1: Add FDP1 device nodes arm64: dts: renesas: r8a774e1: Add VSP instances arm64: 
dts: renesas: r8a774e1: Add FCPF and FCPV instances arm64: dts: renesas: r8a774e1-hihope-rzg2h-ex: Enable sata misc: pci_endpoint_test: Add Device ID for RZ/G2H PCIe controller arm64: dts: renesas: r8a774e1: Add PCIe EP nodes dt-bindings: pci: rcar-pci-ep: Document r8a774e1 arm64: dts: renesas: r8a774e1: Add SATA controller node arm64: dts: renesas: r8a774e1: Add PCIe device nodes misc: pci_endpoint_test: Add Device ID for RZ/G2M and RZ/G2N PCIe controllers arm64: dts: renesas: r8a774b1: Add PCIe EP nodes arm64: dts: renesas: r8a774a1: Add PCIe EP nodes arm64: dts: renesas: r8a774c0: Add PCIe EP node dt-bindings: pci: rcar-pci-ep: Document r8a774a1 and r8a774b1 ata: sata_rcar: Fix DMA boundary mask arm64: dts: renesas: r8a774b1-hihope-rzg2n-ex: Enable sata arm64: dts: renesas: r8a774b1: Add SATA controller node dt-bindings: ata: sata_rcar: Add r8a774b1 support CIP: Bump version suffix to -cip37 after merge from stable misc: pci_endpoint_test: Add Device ID for RZ/G2E PCIe controller arm64: defconfig: Enable R-Car PCIe endpoint driver PCI: rcar: Add endpoint mode support dt-bindings: PCI: rcar: Add bindings for R-Car PCIe endpoint controller PCI: rcar: Fix calculating mask for PCIEPAMR register PCI: rcar: Move shareable code to a common file arm64: defconfig: Enable CONFIG_PCIE_RCAR_HOST PCI: rcar: Rename pcie-rcar.c to pcie-rcar-host.c PCI: endpoint: functions/pci-epf-test: Print throughput information PCI: endpoint: Add support to handle multiple base for mapping outbound memory PCI: endpoint: Pass page size as argument to pci_epc_mem_init() PCI: endpoint: Fix ->set_msix() to take BIR and offset as arguments PCI: pci-epf-test: Add support to defer core initialization PCI: endpoint: Add notification for core init completion PCI: endpoint: Add core init notifying feature PCI: endpoint: Assign function number for each PF in EPC core PCI: endpoint: Protect concurrent access to pci_epf_ops with mutex PCI: endpoint: Replace spinlock with mutex PCI: endpoint: Use 
notification chain mechanism to notify EPC events to EPF tools: PCI: Fix fd leakage tools: PCI: Exit with error code when test fails PCI: dwc: Fix dw_pcie_ep_raise_msix_irq() to get correct MSI-X table address PCI: endpoint: Fix clearing start entry in configfs PCI: endpoint: Cast the page number to phys_addr_t PCI: endpoint: Clear BAR before freeing its space PCI: endpoint: Skip odd BAR when skipping 64bit BAR PCI: endpoint: Allocate enough space for fixed size BAR PCI: endpoint: Set endpoint controller pointer to NULL PCI: endpoint: Add support to specify alignment for buffers allocated to BARs PCI: endpoint: Fix a potential NULL pointer dereference PCI: endpoint: Remove features member in struct pci_epc PCI: designware-plat: Remove setting epc->features in Designware plat EP driver PCI: rockchip: Remove pci_epf_linkup() from Rockchip EP driver PCI: cadence: Remove pci_epf_linkup() from Cadence EP driver PCI: pci-epf-test: Use pci_epc_get_features() to get EPC features PCI: pci-epf-test: Do not allocate next BARs memory if current BAR is 64Bit PCI: pci-epf-test: Remove setting epf_bar flags in function driver PCI: endpoint: Fix pci_epf_alloc_space() to set correct MEM TYPE flags PCI: endpoint: Add helper to get first unreserved BAR PCI: cadence: Populate ->get_features() cdns_pcie_epc_ops PCI: rockchip: Populate ->get_features() dw_pcie_ep_ops PCI: pci-dra7xx: Populate ->get_features() dw_pcie_ep_ops PCI: designware-plat: Populate ->get_features() dw_pcie_ep_ops PCI: dwc: Add ->get_features() callback function to dw_pcie_ep_ops PCI: endpoint: Add new pci_epc_ops to get EPC features CIP: Bump version suffix to -cip36 after merge from stable with ravb fix Revert "ravb: Fixed to be able to unload modules" CIP: Bump version suffix to -cip35 after merge from stable CIP: Bump version suffix to -cip34 after merge from stable arm64: dts: renesas: Fix SD Card/eMMC interface device node names arm64: dts: renesas: r8a774e1: Add RWDT node dt-bindings: watchdog: renesas,wdt: 
Document r8a774e1 support arm64: dts: renesas: r8a774e1: Add MSIOF nodes spi: renesas,sh-msiof: Add r8a774e1 support arm64: dts: renesas: r8a774e1: Add I2C and IIC-DVFS support dt-bindings: i2c: renesas,iic: Document r8a774e1 support dt-bindings: i2c: renesas,i2c: Document r8a774e1 support arm64: dts: renesas: r8a774e1: Add SDHI nodes mmc: renesas_sdhi_internal_dmac: Add r8a774e1 support arm64: dts: renesas: r8a774e1: Add SCIF and HSCIF nodes arm64: dts: renesas: r8a774e1: Add CAN[FD] support can: rcar_can: Remove unused platform data support arm64: dts: renesas: r8a774e1: Add TMU device nodes arm64: dts: renesas: r8a774e1: Add CMT device nodes arm64: dts: renesas: r8a774e1: Add RZ/G2H thermal support thermal: rcar_gen3_thermal: Add r8a774e1 support thermal/drivers/rcar_gen3: Fix undefined temperature if negative thermal: rcar_gen3_thermal: Generate interrupt when temperature changes thermal: rcar_gen3_thermal: Remove temperature bound arm64: dts: renesas: r8a774e1: Add operating points arm64: dts: renesas: r8a774e1: Add Ethernet AVB node arm64: dts: renesas: r8a774e1: Add GPIO device nodes arm64: dts: renesas: r8a774e1: Add SYS-DMAC device nodes dt-bindings: dma: renesas,rcar-dmac: Document R8A774E1 bindings arm64: dts: renesas: r8a774e1: Add IPMMU device nodes iommu/ipmmu-vmsa: Hook up R8A774E1 DT matching code dt-bindings: iommu: renesas,ipmmu-vmsa: Add r8a774e1 support arm64: dts: renesas: Add HiHope RZ/G2H sub board support arm64: dts: renesas: Add HiHope RZ/G2H main board support dt-bindings: arm: renesas: Add HopeRun RZ/G2H boards arm64: dts: renesas: Initial r8a774e1 SoC device tree pinctrl: sh-pfc: pfc-r8a77951: Add R8A774E1 PFC support dt-bindings: pinctrl: sh-pfc: Document r8a774e1 PFC support pinctrl: sh-pfc: Split R-Car H3 support in two independent drivers pinctrl: sh-pfc: pfc-r8a7795: Fix typo in pinmux macro for SCL3 pinctrl: sh-pfc: pfc-r8a7795-es1: Fix typo in pinmux macro for SCL3 pinctrl: sh-pfc: r8a7795: Use new macros for non-GPIO pins 
pinctrl: sh-pfc: r8a7795-es1: Use new macros for non-GPIO pins pinctrl: sh-pfc: r8a7795: Add TPU pins, groups and functions pinctrl: sh-pfc: r8a7795-es1: Add TPU pins, groups and functions pinctrl: sh-pfc: rcar-gen3: Rename RTS{0,1,3,4}# pin function definitions pinctrl: sh-pfc: rcar-gen3: Retain TDSELCTRL register across suspend/resume pinctrl: sh-pfc: r8a7795: Deduplicate VIN5 pin definitions pinctrl: sh-pfc: r8a7795: Add I2C{0,3,5} pins, groups and functions pinctrl: sh-pfc: r8a7795-es1: Add I2C{0,3,5} pins, groups and functions pinctrl: sh-pfc: r8a7795: Fix VIN versioned groups pinctrl: sh-pfc: r8a77965: Fix DU_DOTCLKIN3 drive/bias control arm64: defconfig: Enable R8A774E1 SoC clk: renesas: cpg-mssr: Add r8a774e1 support dt-bindings: clock: renesas,cpg-mssr: Document r8a774e1 clk: renesas: rzg2: Mark RWDT clocks as critical clk: renesas: cpg-mssr: Mark clocks as critical only if on at boot clk: renesas: rcar-gen3: Allow changing the RPC[D2] clocks clk: renesas: Add r8a774e1 CPG Core Clock Definitions clk: renesas: rcar-gen3: Add RPC clocks soc: renesas: rcar-rst: Add support for RZ/G2H dt-bindings: reset: rcar-rst: Document r8a774e1 reset module soc: renesas: Identify RZ/G2H dt-bindings: arm: renesas: Document RZ/G2H SoC DT bindings soc: renesas: Add Renesas R8A774E1 config option soc: renesas: rcar-sysc: Add r8a774e1 support dt-bindings: power: renesas,rcar-sysc: Document r8a774e1 SYSC binding dt-bindings: power: Add r8a774e1 SYSC power domain definitions arm64: dts: renesas: r8a774a1: Remove audio port node arm64: dts: renesas: Add HiHope RZ/G2N Rev2.0/3.0/4.0 board with idk-1110wr display arm64: dts: renesas: Add HiHope RZ/G2N Rev.3.0/4.0 sub board support arm64: dts: renesas: Add HiHope RZ/G2N Rev.3.0/4.0 main board support arm64: dts: renesas: Add HiHope RZ/G2M Rev.3.0/4.0 board with idk-1110wr display arm64: dts: renesas: hihope-rzg2-ex: Separate out lvds specific nodes into common file arm64: dts: renesas: Add HiHope RZ/G2M Rev.3.0/4.0 sub board support 
arm64: dts: renesas: Add HiHope RZ/G2M Rev.3.0/4.0 main board support arm64: dts: renesas: Add HiHope RZ/G2M[N] Rev.3.0/4.0 specific into common file arm64: dts: renesas: hihope-common: Separate out Rev.2.0 specific into hihope-rev2.dtsi file arm64: dts: renesas: r8a774b1-hihope-rzg2n[-ex]: Rename HiHope RZ/G2N boards arm64: dts: renesas: r8a774a1-hihope-rzg2m[-ex/-ex-idk-1110wr]: Rename HiHope RZ/G2M boards CIP: Bump version suffix to -cip33 after merge from stable drm: atomic helper: fix W=1 warnings drm: Add drm_atomic_get_old/new_private_obj_state drm: of: Fix linking when CONFIG_OF is not set CIP: Bump version suffix to -cip32 after merge from stable drm: of: Fix double-free bug CIP: Bump version suffix to -cip31 after merge from stable arm64: dts: renesas: Add EK874 board with idk-2121wr display support dt-bindings: display: Add idk-2121wr binding arm64: dts: renesas: rzg2: Add reset control properties for display arm64: dts: renesas: r8a774c0: Point LVDS0 to its companion LVDS1 drm: rcar-du: lvds: Allow for even and odd pixels swap drm: rcar-du: lvds: Get dual link configuration from DT drm: of: Add drm_of_lvds_get_dual_link_pixel_order drm: rcar-du: lvds: Improve identification of panels drm: rcar-du: lvds: Get mode from state drm: Add atomic variants for bridge enable/disable drm: Add drm_atomic_get_(old|new)_connector_for_encoder() helpers drm: rcar_lvds: Fix dual link mode operations drm: rcar-du: Skip LVDS1 output on Gen3 when using dual-link LVDS mode drm: rcar-du: lvds: Add support for dual-link mode dt-bindings: display: renesas: lvds: Add renesas,companion property drm: bridge: Add dual_link field to the drm_bridge_timings structure drm: rcar-du: lvds: Remove LVDS double-enable checks arm64: defconfig: Enable additional support for Renesas platforms ASoC: rsnd: fixup SSI clock during suspend/resume modes CIP: Bump version suffix to -cip30 after merge from stable CIP: Bump version suffix to -cip29 after merge from stable CIP: Bump version suffix to 
-cip28 after merge from stable CIP: Bump version suffix to -cip27 after merge from stable CIP: Bump version suffix to -cip26 after merge from stable CIP: Bump version suffix to -cip25 after merge from stable arm64: dts: renesas: Add HiHope RZ/G2M board with idk-1110wr display dt-bindings: display: Add idk-1110wr binding CIP: Bump version suffix to -cip24 after merge from stable CIP: Bump version suffix to -cip23 after merge from stable CIP: Bump version suffix to -cip22 after merge from stable CIP: Bump version suffix to -cip21 after merge from stable arm64: dts: renesas: cat874: Enable usb role switch support arm64: dts: renesas: cat874: Enable USB3.0 host/peripheral device node usb: gadget: udc: renesas_usb3: Enhance role switch support usb: typec: fix an IS_ERR() vs NULL bug in hd3ss3220_probe() usb: typec: hd3ss3220: hd3ss3220_probe() warn: passing zero to 'PTR_ERR' usb: typec: add dependency for TYPEC_HD3SS3220 usb: typec: hd3ss3220_irq() can be static usb: typec: driver for TI HD3SS3220 USB Type-C DRP port controller dt-bindings: usb: renesas_usb3: Document usb role switch support dt-bindings: usb: hd3ss3220 device tree binding document usb: roles: Add fwnode_usb_role_switch_get() function device connection: Add fwnode_connection_find_match() usb: roles: Introduce stubs for the exiting functions in role.h device connection: Find connections also by checking the references device property: Introduce fwnode_find_reference() device connection: Find device connections also from device graphs device connection: Prepare support for firmware described connections usb: typec: Find the ports by also matching against the device node usb: roles: Find the muxes by also matching against the device node usb: typec: mux: Fix unsigned comparison with less than zero usb: typec: mux: Find the muxes by also matching against the device node device connection: Add fwnode member to struct device_connection CIP: Bump version suffix to -cip20 after merge from stable arm64: dts: 
renesas: r8a774b1: Add USB3.0 device nodes arm64: dts: renesas: r8a774b1: Add USB-DMAC and HSUSB device nodes arm64: dts: renesas: r8a774b1: Add USB2.0 phy and host (EHCI/OHCI) device nodes dt-bindings: usb: renesas_usb3: Document r8a774b1 support dt-bindings: usb: renesas_gen3: Rename bindings documentation file to reflect IP block dt-bindings: usb-xhci: Add r8a774b1 support dt-bindings: rcar-gen3-phy-usb3: Add r8a774b1 support dt-bindings: usb: renesas_usbhs: Add r8a774b1 support dt-bindings: usb: renesas_usbhs: Rename bindings documentation file dt-bindings: dmaengine: usb-dmac: Add binding for r8a774b1 dt-bindings: rcar-gen3-phy-usb2: Add r8a774b1 support arm64: dts: renesas: r8a774b1: Add Sound and Audio DMAC device nodes ASoC: rsnd: Document r8a774b1 bindings arm64: dts: renesas: r8a774a1: Remove audio port node arm64: dts: renesas: Add support for Advantech idk-1110wr LVDS panel arm64: dts: renesas: hihope-rzg2-ex: Add LVDS support drm: rcar-du: lvds: Add r8a774b1 support arm64: dts: renesas: hihope-rzg2-ex: Enable backlight arm64: dts: renesas: r8a774b1: Add PWM device nodes arm64: dts: renesas: r8a774b1: Add FDP1 device nodes arm64: dts: renesas: r8a774b1-hihope-rzg2n: Add display clock properties arm64: dts: renesas: r8a774b1: Add HDMI encoder instance arm64: dts: renesas: r8a774b1: Add DU device to DT drm: rcar-du: Add R8A774B1 support arm64: dts: renesas: hihope-common: Move du clk properties out of common dtsi arm64: dts: renesas: r8a774b1: Connect Ethernet-AVB to IPMMU-DS0 arm64: dts: renesas: r8a774b1: Tie SYS-DMAC to IPMMU-DS0/1 arm64: dts: renesas: r8a774b1: Add VSP instances arm64: dts: renesas: r8a774b1: Add FCPF and FCPV instances arm64: dts: renesas: r8a774b1: Add IPMMU device nodes iommu/ipmmu-vmsa: Hook up r8a774b1 DT matching code dt-bindings: iommu: ipmmu-vmsa: Add r8a774b1 support arm64: dts: renesas: r8a774b1: Add CAN and CAN FD support dt-bindings: can: rcar_canfd: document r8a774b1 support dt-bindings: can: rcar_can: document r8a774b1 
support arm64: dts: renesas: r8a774b1: Add TMU device nodes clk: renesas: r8a774b1: Add TMU clock dt-bindings: timer: renesas: tmu: Document r8a774b1 bindings arm64: dts: renesas: r8a774b1: Add CMT device nodes dt-bindings: timer: renesas, cmt: Document r8a774b1 CMT support arm64: dts: renesas: r8a774b1: Add RZ/G2N thermal support thermal: rcar_gen3_thermal: Add r8a774b1 support dt-bindings: thermal: rcar-gen3-thermal: Add r8a774b1 support arm64: dts: renesas: r8a774b1: Add OPPs table for cpu devices arm64: dts: renesas: r8a774b1: Add I2C and IIC-DVFS support dt-bindings: i2c: sh_mobile: Add r8a774b1 support dt-bindings: i2c: sh_mobile: Rename bindings documentation file dt-bindings: i2c: rcar: Add r8a774b1 support dt-bindings: i2c: rcar: Rename bindings documentation file arm64: dts: renesas: r8a774b1-hihope-rzg2n: Enable HS400 mode arm64: dts: renesas: r8a774b1: Add SDHI support mmc: renesas_sdhi_internal_dmac: Add r8a774b1 support dt-bindings: mmc: renesas_sdhi: Add r8a774b1 support arm64: dts: renesas: r8a774b1: Add INTC-EX device node arm64: dts: renesas: hihope-rzg2-ex: Let the board specific DT decide about pciec1 arm64: dts: renesas: r8a774b1: Add PCIe device nodes arm64: dts: renesas: r8a774b1: Add all MSIOF nodes arm64: dts: renesas: r8a774b1: Add RWDT node dt-bindings: watchdog: renesas-wdt: Document r8a774b1 support dt-bindings: watchdog: Rename bindings documentation file dt-bindings: spi: sh-msiof: Add r8a774b1 support arm64: dts: renesas: Add HiHope RZ/G2N sub board support arm64: dts: renesas: r8a774b1: Add Ethernet AVB node dt-bindings: net: ravb: Add support for r8a774b1 SoC arm64: dts: renesas: r8a774b1: Add GPIO device nodes dt-bindings: gpio: rcar: Add DT binding for r8a774b1 arm64: dts: renesas: r8a774b1: Add SCIF and HSCIF nodes arm64: dts: renesas: r8a774b1: Add SYS-DMAC device nodes dt-bindings: dmaengine: rcar-dmac: Document R8A774B1 bindings CIP: Bump version suffix to -cip19 after merge from stable arm64: dts: renesas: r8a774c0: cat874: 
Sort nodes arm64: dts: renesas: Use ip=on for bootargs arm64: dts: renesas: r8a774c0: cat874: Add definition for 12V regulator arm64: dts: renesas: Update 'vsps' properties for readability arm64: dts: renesas: r8a774c0: Fix register range of display node arm64: dts: renesas: r8a774c0: Add missing assigned-clocks for CAN[01] arm64: dts: renesas: r8a774c0: Clean up CPU compatibles arm64: dts: renesas: r8a774c0: Add dynamic power coefficient arm64: dts: renesas: r8a774c0: Create thermal zone to support IPA thermal: rcar_thermal: update calculation formula for R-Car Gen3 SoCs dt-bindings: can: rcar_can: Complete documentation for RZ/G2[EM] dt-bindings: can: rcar_can: document r8a77965 support CIP: Bump version suffix to -cip18 after merge from stable CIP: Bump version suffix to -cip17 after merge from stable arm64: defconfig: Enable R8A774B1 SoC arm64: dts: renesas: Add HiHope RZ/G2N main board support arm64: dts: renesas: Initial r8a774b1 SoC device tree dt-bindings: serial: sh-sci: Document r8a774b1 bindings pinctrl: sh-pfc: pfc-r8a77965: Fix typo in pinmux macro for SCL3 pinctrl: sh-pfc: r8a77965: Add R8A774B1 PFC support dt-bindings: pinctrl: sh-pfc: Document r8a774b1 PFC support pinctrl: sh-pfc: r8a77965: Use new macros for non-GPIO pins pinctrl: sh-pfc: r8a77965: Add TPU pins, groups and functions pinctrl: sh-pfc: r8a77965: Add I2C{0,3,5} pins, groups and functions pinctrl: sh-pfc: r8a77965: Add DRIF pins, groups and functions pinctrl: sh-pfc: r8a77965: Add TMU pins, groups and functions pinctrl: sh-pfc: r8a77965: Replace DU_DOTCLKIN2 by DU_DOTCLKIN3 pinctrl: sh-pfc: r8a77965: Add CAN FD pins, groups and functions pinctrl: sh-pfc: r8a77965: Add CAN pins, groups and functions pinctrl: sh-pfc: r8a77965: Add VIN[4|5] groups/functions pinctrl: sh-pfc: r8a77965: Add Audio SSI pin support pinctrl: sh-pfc: r8a77965: Add Audio clock pin support pinctrl: sh-pfc: r8a77965: Add SATA pins, groups and functions clk: renesas: cpg-mssr: Add r8a774b1 support dt-bindings: clock: 
renesas: cpg-mssr: Document r8a774b1 binding dt-bindings: clk: Add r8a774b1 CPG Core Clock Definitions soc: renesas: rcar-rst: Add support for RZ/G2N dt-bindings: reset: rcar-rst: Document r8a774b1 reset module soc: renesas: rcar-sysc: Add r8a774b1 support soc: renesas: r8a774c0-sysc: Fix power request conflicts soc: renesas: r8a77990-sysc: Fix power request conflicts soc: renesas: r8a77980-sysc: Fix power request conflicts soc: renesas: r8a77970-sysc: Fix power request conflicts soc: renesas: r8a77965-sysc: Fix power request conflicts soc: renesas: r8a7796-sysc: Fix power request conflicts soc: renesas: r8a7795-sysc: Fix power request conflicts soc: renesas: rcar-sysc: Prepare for fixing power request conflicts dt-bindings: power: rcar-sysc: Document r8a774b1 sysc dt-bindings: power: Add r8a774b1 SYSC power domain definitions soc: renesas: Identify RZ/G2N soc: renesas: Add Renesas R8A774B1 config option dt-bindings: arm: renesas: Add HopeRun RZ/G2N boards dt-bindings: arm: renesas: Document RZ/G2N SoC DT bindings CIP: Bump version suffix to -cip16 after merge from stable CIP: Bump version suffix to -cip15 after merge from stable gitlab-ci: Use external linux-cip-pipelines repository to define CI arm64: dts: renesas: r8a774a1: Add SSIU support for sound ASoC: rsnd: add SSIU BUSIF support ASoC: rsnd: add .get_id/.get_id_sub ASoC: rsnd: move .get_status under rsnd_mod_ops ASoC: rsnd: merge .nolock_start and .prepare ASoC: rsnd: ssiu: Support to init different BUSIF instance ASoC: rsnd: ssiu: Support BUSIF other than BUSIF0 ASoc: rsnd: dma: Calculate PDMACHCRE with consider of BUSIF ASoc: rsnd: dma: Calculate dma address with consider of BUSIF ASoC: rsnd: ssi: Check runtime channel number rather than hw_params ASoC: rsnd: ssi: Fix issue in dma data address assignment ASoC: rsnd: remove is_play parameter from hw_rule function ASoC: rsnd: add support for 8 bit S8 format ASoC: rsnd: add support for 16/24 bit slot widths ASoC: rsnd: add warning message to 
rsnd_kctrl_accept_runtime() CIP: Bump version suffix to -cip14 after merge from stable gitlab-ci: Remove test timeout gitlab-ci: Remove unofficial build configurations gitlab-ci: Split tests into separate jobs CIP: Bump version suffix to -cip13 after merge from stable arm64: dts: renesas: hihope-rzg2-ex: Enable CAN interfaces arm64: dts: renesas: r8a774a1: Add CANFD support arm64: dts: renesas: r8a774a1: Add missing assigned-clocks for CAN[01] dt-bindings: can: rcar_canfd: document r8a774a1 support arm64: dts: renesas: hihope-common: Add HDMI audio support arm64: dts: renesas: r8a774a1: Use extended audio dmac registers arm64: dts: renesas: cat874: Add BT support arm64: dts: renesas: cat874: Add WLAN support arm64: dts: renesas: hihope-common: Add WLAN support arm64: dts: renesas: hihope-common: Add BT support arm64: dts: renesas: hihope-common: Add PCA9654 I/O expander CIP: Bump version suffix to -cip12 after merge from stable arm64: dts: renesas: r8a774c0: Add CANFD support dt-bindings: can: rcar_canfd: document r8a774c0 support arm64: dts: renesas: cat874: Add HDMI audio arm64: dts: renesas: cat874: Add HDMI video support arm64: defconfig: Enable TDA19988 arm64: dts: renesas: r8a774c0: Add display output support media: use strscpy() instead of strlcpy() drm: rcar-du: Replace EXT_CTRL_REGS feature flag with generation check drm: rcar-du: Disable unused DPAD outputs drm/rcar-du: Use drm_fbdev_generic_setup() drm: rcar-du: Reject modes that fail CRTC timing requirements drm: rcar-du: Fix external clock error checks drm: rcar-du: Fix vblank initialization drm: rcar-du: Fix the return value in case of error in 'rcar_du_crtc_set_crc_source()' drm/rcar-du: Replace drm_dev_unref with drm_dev_put drm: rcar-du: Enable configurable DPAD0 routing on Gen3 drm: rcar-du: Improve non-DPLL clock selection drm: rcar-du: lvds: Adjust operating frequency for D3 and E3 drm: rcar-du: lvds: Fix post-DLL divider calculation drm: rcar-du: Turn LVDS clock output on/off for DPAD0 output 
on D3/E3 drm: rcar-du: lvds: Add API to enable/disable clock output drm: rcar-du: lvds: Don't fail probe if output is not connected on D3/E3 drm: rcar-du: Simplify encoder registration drm: rcar-du: Move CRTC outputs bitmask to private CRTC state drm: rcar-du: lvds: add R8A774C0 support drm: rcar-du: Add r8a774c0 device support drm: rcar-du: Use LVDS PLL clock as dot clock when possible drm: rcar-du: Perform the initial CRTC setup from rcar_du_crtc_get() drm: rcar-du: lvds: D3/E3 support dt-bindings: display: renesas: lvds: Document r8a774c0 bindings dt-bindings: display: renesas: lvds: Add EXTAL and DU_DOTCLKIN clocks dt-bindings: display: renesas: du: Document r8a774c0 bindings media: dt-bindings: media: renesas-fcp: Add RZ/G2 support media: vsp1: Add RZ/G support CIP: Bump version suffix to -cip11 after merge from stable gitlab-ci: Always store job artifacts gitlab-ci: Increase test timeout to 60 minutes arm64: dts: renesas: hihope-common: Add HDMI support arm64: dts: renesas: r8a774a1: Add HDMI encoder instance arm64: dts: renesas: r8a774a1: Connect Ethernet-AVB to IPMMU-DS0 arm64: dts: renesas: r8a774a1: Tie Audio-DMAC to IPMMU-MP arm64: dts: renesas: r8a774a1: Tie SYS-DMAC to IPMMU-DS0/1 arm64: dts: renesas: r8a774a1: Add FDP1 instance arm64: dts: renesas: r8a774a1: Add DU device to DT arm64: dts: renesas: r8a774a1: Add VSP instances arm64: dts: renesas: hihope-rzg2-ex: Enable PCIe support arm64: dts: renesas: hihope-common: Declare pcie bus clock arm64: dts: renesas: r8a774a1: Add PCIe device nodes drm: rcar-du: Update framebuffer pitch and alignment limits for Gen3 drm: rcar-du: Store V4L2 fourcc in rcar_du_format_info structure drm: rcar-du: Add support for missing pixel formats drm: rcar-du: Rename and document dpll_ch field drm: rcar-du: Rework clock configuration based on hardware limits drm: rcar-du: Support interlaced video output through vsp1 drm: rcar-du: Don't use TV sync mode when not supported by the hardware drm: rcar-du: Cache DSYSR value to 
ensure known initial value drm: rcar-du: Add interlaced feature flag drm: rcar-du: Refactor Feature and Quirk definitions drm: rcar-du: dw-hdmi: Reject modes with a too high clock frequency drm: rcar-du: lvds: Add r8a774a1 support drm: rcar-du: Add R8A774A1 support PCI: rcar: Do not shadow the 'irq' variable PCI: rcar: Clean up debug messages PCI: rcar: Replace various variable types with unsigned ones for register values PCI: rcar: Replace unsigned long with u32/unsigned int in register accessors dt-bindings: display: renesas: Add r8a774a1 support dt-bindings: display: renesas: lvds: Document r8a774a1 bindings dt-bindings: display: renesas: du: Document the r8a774a1 bindings dt-bindings: PCI: rcar: Add device tree support for r8a774a1 CIP: Bump version suffix to -cip10 after merge from stable arm64: dts: renesas: hihope-common: Enable USB3.0 arm64: dts: renesas: hihope-common: Add USB 2.0 support arm64: dts: renesas: r8a774a1: Fix USB 2.0 clocks phy: renesas: rcar-gen3-usb2: fix imbalance powered flag arm64: dts: renesas: hihope-common: Remove "label" from LEDs arm64: dts: renesas: hihope-common: Add LEDs support arm64: dts: renesas: hihope-common: Add uSD and eMMC mmc: renesas_sdhi: prevent overflow for max_req_size mmc: tmio: introduce macro for max block size mmc: renesas_sdhi: Change HW adjustment register according to speed mode arm64: dts: renesas: r8a774a1: Add dynamic power coefficient arm64: dts: renesas: r8a774a1: Create thermal zone to support IPA arm64: dts: renesas: r8a774a1: Add CPU capacity-dmips-mhz arm64: dts: renesas: r8a774a1: Add CPU topology on r8a774a1 SoC arm64: dts: renesas: r8a774a1: Add operating points thermal: rcar_gen3_thermal: Update temperature conversion method thermal: rcar_gen3_thermal: Update calculation formula of IRQTEMP thermal: rcar_gen3_thermal: Update value of Tj_1 thermal: rcar_gen3_thermal: Fix to show correct trip points number thermal: rcar_gen3_thermal: fix interrupt type thermal: rcar_gen3_thermal: Fix init value of 
IRQCTL register thermal: rcar_gen3_thermal: Register hwmon sysfs interface arm64: dts: renesas: r8a774a1: Add TMU device nodes clk: renesas: r8a774a1: Add TMU clock arm64: dts: renesas: r8a774a1: Add CMT device nodes arm64: dts: renesas: hihope-common: Add RWDT support watchdog: renesas_wdt: Add a few cycles delay watchdog: renesas_wdt: Use 'dev' instead of dereferencing it repeatedly watchdog: renesas_wdt: drop superfluous glob pattern watchdog: renesas_wdt: don't keep timer value during suspend/resume watchdog: renesas_wdt: Fix typos watchdog: renesas_wdt: stop when unregistering arm64: dts: renesas: Add HiHope RZ/G2M sub board support arm64: dts: renesas: hihope-common: Add pincontrol support to scif2/scif clock arm64: dts: renesas: Add HiHope RZ/G2M main board support dt-bindings: Add vendor prefix for HopeRun dt-bindings: arm: renesas: Add HopeRun RZ/G2[M] boards gitlab-ci: Start testing the r8a774a1-hihope-rzg2m-ex device arm64: dts: renesas: r8a774a1: Add clkp2 clock to CAN nodes arm64: dts: Remove inconsistent use of 'arm,armv8' compatible string arm64: dts: renesas: r8a774a1: Fix hsusb reg size arm64: dts: renesas: r8a774a1: Enable DMA for SCIF2 arm64: dts: renesas: r8a774a1: Replace clock magic numbers arm64: dts: renesas: r8a774a1: Replace power magic numbers arm64: dts: renesas: r8a774a1: Add CAN nodes arm64: dts: renesas: Remove unneeded status from thermal nodes arm64: dts: renesas: Fix whitespace around assignments arm64: dts: renesas: r8a774a1: Add USB3.0 device nodes arm64: dts: renesas: r8a774a1: Add USB-DMAC and HSUSB device nodes arm64: dts: renesas: r8a774a1: Add USB2.0 phy and host(EHCI/OHCI) device nodes arm64: dts: renesas: r8a774a1: Add FCPF and FCPV instances arm64: dts: renesas: r8a774a1: Add audio support arm64: dts: renesas: r8a774a1: Add PWM device nodes arm64: dts: renesas: r8a774a1: Add Cortex-A53 CPU cores arm64: dts: renesas: r8a774a1: Add all MSIOF nodes arm64: dts: renesas: r8a774a1: Add IPMMU device nodes arm64: dts: renesas: 
r8a774a1: Add RZ/G2M thermal support arm64: dts: renesas: r8a774a1: Add I2C and IIC-DVFS support arm64: dts: renesas: r8a774a1: Add SDHI nodes arm64: dts: renesas: r8a774a1: Add GPIO device nodes arm64: dts: renesas: r8a774a1: Add pinctrl device node arm64: dts: renesas: r8a774a1: Add RWDT node arm64: dts: renesas: r8a774a1: Add Ethernet AVB node arm64: dts: renesas: r8a774a1: Add INTC-EX device node arm64: dts: renesas: r8a774a1: Add SCIF and HSCIF nodes arm64: dts: renesas: r8a774a1: Add SYS-DMAC controller nodes arm64: dts: renesas: Initial r8a774a1 SoC device tree mmc: renesas_sdhi_internal_dmac: set scatter/gather max segment size ravb: Avoid unsupported internal delay mode for R-Car E3/D3 ravb: remove tx buffer addr 4byte alilgnment restriction for R-Car Gen3 spi: sh-msiof: fix deferred probing dmaengine: rcar-dmac: Update copyright information dmaengine: rcar-dmac: set scatter/gather max segment size serial: sh-sci: Fix fallback to PIO in sci_dma_rx_complete() serial: sh-sci: Extract sci_dma_rx_reenable_irq() serial: sh-sci: Extract sci_dma_rx_chan_invalidate() serial: sh-sci: Fix crash in rx_timer_fn() on PIO fallback soc: renesas: rcar-sysc: Fix power domain control after system resume soc: renesas: rcar-sysc: Merge PM Domain registration and linking soc: renesas: rcar-sysc: Remove rcar_sysc_power_{down,up}() helpers clk: renesas: cpg-mssr: Remove error messages on out-of-memory conditions clk: renesas: cpg-mssr: Use genpd of_node instead of local copy gpio: rcar: Pedantic formatting gpio: rcar: select General Output Register to set output states gpio: rcar: reference device instead of platform device thermal: rcar_gen3_thermal: Add r8a774a1 support dt-bindings: dmaengine: usb-dmac: Add binding for r8a774a1 dt-bindings: thermal: rcar-gen3-thermal: Add r8a774a1 support dt-bindings: usb: renesas_usbhs: Add r8a774a1 support dt-bindings: usb-xhci: Add r8a774c0 support dt-bindings: usb-xhci: Add r8a774a1 support dt-bindings: rcar-gen3-phy-usb3: Add r8a774a1 
support dt-bindings: can: rcar_can: Add r8a774c0 support dt-bindings: can: rcar_can: Fix RZ/G2 CAN clocks dt-bindings: can: rcar_can: Add r8a774a1 support pinctrl: sh-pfc: sh73a0: Use new macros for non-GPIO pins pinctrl: sh-pfc: sh73a0: Add missing TO pin to tpu4_to3 group pinctrl: sh-pfc: sh73a0: Fix fsic_spdif pin groups pinctrl: sh-pfc: r8a7791: Fix scifb2_data_c pin group pinctrl: sh-pfc: r8a7791: Fix VIN1 versioned groups pinctrl: sh-pfc: r8a7791: Remove bogus marks from vin1_b_data18 group pinctrl: sh-pfc: r8a7791: Remove bogus ctrl marks from qspi_data4_b group pinctrl: sh-pfc: r8a77995: Remove unused PINMUX_IPSR_{MSEL2,PHYS}() pinctrl: sh-pfc: r8a7740: Add missing LCD0 marks to lcd0_data24_1 group pinctrl: sh-pfc: r8a7740: Add missing REF125CK pin to gether_gmii group pinctrl: sh-pfc: r8a7796: Remove placeholder I2C pin data pinctrl: sh-pfc: r8a7796: Use new macros for non-GPIO pins pinctrl: sh-pfc: r8a7796: Add TPU pins, groups and functions pinctrl: sh-pfc: r8a77990: Use new macros for non-GPIO pins pinctrl: sh-pfc: Move PIN_NONE to shared header file pinctrl: sh-pfc: Add PORT_GP_27 helper macro pinctrl: sh-pfc: rcar-gen3: Rename SEL_NDFC to SEL_NDF pinctrl: sh-pfc: rcar-gen3: Rename RTS{0,1,3,4}# pin function definitions pinctrl: sh-pfc: r8a77990: Fix MOD_SEL1 bit30 when using SSI_SCK2 and SSI_WS2 pinctrl: sh-pfc: r8a77990: Fix MOD_SEL1 bit31 when using SIM0_D pinctrl: sh-pfc: r8a77990: Fix MOD_SEL0 bit16 when using NFALE and NFRB_N pinctrl: sh-pfc: rcar-gen3: Rename SEL_ADG_{A,B,C} to SEL_ADG{A,B,C} pinctrl: sh-pfc: rcar-gen3: Remove CC5_OSCOUT pin pinctrl: sh-pfc: rcar-gen3: Remove HDMI CEC pins, groups, and functions pinctrl: sh-pfc: Add missing #include <linux/errno.h> pinctrl: sh-pfc: rcar-gen3: Retain TDSELCTRL register across suspend/resume pinctrl: sh-pfc: r8a77990: Move CANFD pin groups and functions pinctrl: sh-pfc: r8a77990: Rename IOCTRLx registers pinctrl: sh-pfc: r8a7796: Move CANFD pin groups and functions pinctrl: sh-pfc: r8a7796: 
Deduplicate VIN5 pin definitions pinctrl: sh-pfc: r8a7796: Add I2C{0,3,5} pins, groups and functions pinctrl: sh-pfc: r8a7796: Fix VIN versioned groups pinctrl: sh-pfc: Validate pin tables at runtime pinctrl: sh-pfc: Add check for empty pinmux groups/functions pinctrl: sh-pfc: Mark run-time debug code __init pinctrl: sh-pfc: Correct printk level of group reference warning pinctrl: sh-pfc: Add new non-GPIO helper macros pinctrl: sh-pfc: Add SH_PFC_PIN_CFG_PULL_UP_DOWN shorthand pinctrl: sh-pfc: Rename 2-parameter CPU_ALL_PORT() variant pinctrl: sh-pfc: Improve PINMUX_IPSR_PHYS() documentation pinctrl: sh-pfc: Validate enum IDs for regs with variable-width fields pinctrl: sh-pfc: Validate enum IDs for regs with fixed-width fields pinctrl: sh-pfc: Absorb enum IDs in PINMUX_DATA_REG() macro pinctrl: sh-pfc: Absorb enum IDs in PINMUX_CFG_REG_VAR() macro pinctrl: sh-pfc: Absorb enum IDs in PINMUX_CFG_REG() macro pinctrl: sh-pfc: Validate fixed-size field widths at build time pinctrl: sh-pfc: Make pinmux_cfg_reg.var_field_width[] variable-length pinctrl: sh-pfc: Validate pins/marks in pin groups at build time pinctrl: sh-pfc: Add physical pin multiplexing helper macros pinctrl: sh-pfc: Validate pinmux tables at runtime when debugging pinctrl: sh-pfc: Print actual field width for variable-width fields CIP: Bump version suffix to -cip9 after merge from stable staging: m57621-mmc: delete driver from the tree. 
CIP: Bump version suffix to -cip8 after merge from stable Update to run all CIP arm, arm64 and x86 configs Update CI to use the latest linux-cip-ci containers CIP: Bump version suffix to -cip7 after merge from stable arm64: dts: renesas: r8a774c0: sort subnodes of the soc node arm64: dts: renesas: r8a774c0: Remove invalid compatible value for CSI40 arm64: dts: renesas: r8a774c0: Fix SCIF5 DMA channels arm64: dts: renesas: r8a774c0: Enable DMA for SCIF2 arm64: dts: renesas: r8a774c0-cat874: Add RWDT support arm64: dts: renesas: r8a774c0-cat874: Add LEDs support arm64: dts: renesas: r8a774c0-cat874: add RTC support arm64: defconfig: enable RX-8581 config option rtc: rx8581: Add support for Epson rx8571 RTC dt-bindings: rtc: add rx8571 compatible rtc: nvmem: remove nvmem from struct rtc_device rtc: nvmem: use devm_nvmem_register() arm64: dts: renesas: cat874: Add USB-HOST support phy: renesas: rcar-gen3-usb2: enable/disable independent irqs phy: renesas: rcar-gen3-usb2: Use pdev's device pointer on dev_vdbg() phy: rcar-gen3-usb2: Add support for r8a77470 phy: renesas: rcar-gen3-usb2: follow the hardware manual procedure phy: renesas: rcar-gen3-usb2: add is_otg_channel to use "role" sysfs phy: renesas: rcar-gen3-usb2: change a condition "dr_mode" phy: renesas: rcar-gen3-usb2: add conditions for uses_otg_pins == false phy: renesas: rcar-gen3-usb2: unify OBINTEN handling phy: renesas: rcar-gen3-usb2: Check a property to use otg pins phy: renesas: rcar-gen3-usb2: Rename has_otg_pins to uses_otg_pins phy: renesas: rcar-gen3-usb2: fix vbus_ctrl for role sysfs arm64: dts: renesas: cat875: Add CAN support arm64: dts: renesas: r8a774c0: Add clkp2 clock to CAN nodes arm64: dts: renesas: r8a774c0: Add CAN nodes arm64: dts: renesas: r8a774c0: Fix cpu nodes style arm64: dts: renesas: r8a774c0: Add OPPs table for cpu devices clk: renesas: rcar-gen3: Remove unused variable clk: renesas: rcar-gen3: Fix cpg_sd_clock_round_rate() return value clk: renesas: rcar-gen3: Correct parent 
clock of Audio-DMAC clk: renesas: rcar-gen3: Correct parent clock of SYS-DMAC clk: renesas: rcar-gen3: Correct parent clock of HS-USB clk: renesas: rcar-gen3: Correct parent clock of EHCI/OHCI clk: renesas: r8a774c0: Add Z2 clock clk: renesas: rcar-gen3: Support Z and Z2 clocks with high frequency parents math64: New DIV64_U64_ROUND_CLOSEST helper clk: renesas: rcar-gen3: Remove CLK_TYPE_GEN3_Z2 clk: renesas: rcar-gen3: Parameterise Z and Z2 clock offset clk: renesas: rcar-gen3: Parameterise Z and Z2 clock fixed divisor clk: renesas: rcar-gen3: Pass name/offset to cpg_sd_clk_register() clk: renesas: r8a774a1: Fix LAST_DT_CORE_CLK clk: renesas: rcar-gen3: Add spinlock clk: renesas: rcar-gen3: Factor out cpg_reg_modify() clk: renesas: r8a774a1: Add missing CANFD clock clk: renesas: Remove usage of CLK_IS_BASIC clk: renesas: rcar-gen3: Add HS400 quirk for SD clock clk: renesas: rcar-gen3: Add documentation for SD clocks clk: renesas: rcar-gen3: Set state when registering SD clocks clk: renesas: r8a774a1: Add CPEX clock CIP: Bump version suffix to -cip6 after merge from stable Add gitlab-ci.yaml CIP: Bump version suffix to -cip5 after merge from stable CIP: Bump version suffix to -cip4 after merge from stable CIP: Bump version suffix to -cip3 after merge from stable dt-bindings: Add vendor prefix for Silicon Linux. 
CIP: Bump version suffix to -cip2 after Renesas patches arm64: defconfig: Enable R-Car thermal driver arm64: dts: renesas: r8a774c0: Add thermal support dt-bindings: thermal: rcar-thermal: add R8A774C0 support thermal: rcar_thermal: add R8A774C0 support arm64: dts: renesas: r8a774c0: Connect RZ/G2E Audio-DMAC to IPMMU arm64: dts: renesas: r8a774c0: Connect RZ/G2E AVB to IPMMU arm64: dts: renesas: r8a774c0: Connect RZ/G2E SYS-DMAC to IPMMU arm64: dts: renesas: r8a774c0: Add PWM support dt-bindings: pwm: rcar: Add r8a774c0 support dt-bindings: pwm: rcar: Add r8a774a1 support arm64: dts: renesas: r8a774c0: Add audio support ASoC: rsnd: Add r8a774c0 support ASoC: rsnd: Add r8a774a1 support arm64: dts: renesas: r8a774c0: Add VIN and CSI-2 device nodes media: dt-bindings: rcar-csi2: Add r8a774c0 media: dt-bindings: rcar-vin: Add R8A774C0 support media: rcar-csi2: Add support for RZ/G2E media: rcar-csi2: Fix PHTW table values for E3/V3M media: rcar-csi2: Handle per-SoC number of channels media: rcar: rcar-csi2: Update V3M/E3 PHTW tables media: rcar-csi2: Add R8A77990 support media: rcar-vin: Add support for RZ/G2E media: rcar-vin: Add support for R-Car R8A77990 arm64: dts: renesas: r8a774c0: Add IPMMU device nodes dt-bindings: iommu: ipmmu-vmsa: Add r8a774c0 support dt-bindings: iommu: ipmmu-vmsa: Add r8a774a1 support iommu/ipmmu-vmsa: Hook up r8a774c0 DT matching code iommu/ipmmu-vmsa: Modify ipmmu_slave_whitelist() to check SoC revisions iommu/ipmmu-vmsa: Hook up R8A774A1 DT maching code arm64: dts: renesas: r8a774c0: Add USB3.0 device nodes usb: gadget: udc: renesas_usb3: Add bindings for r8a774c0 usb: gadget: udc: renesas_usb3: Add r8a774a1 support usb: gadget: udc: renesas_usb3: add support for r8a774c0 usb: gadget: udc: renesas_usb3: add a safety connection way for forced_b_device usb: gadget: udc: renesas_usb3: add support for r8a77990 arm64: dts: renesas: r8a774c0: Add USB-DMAC and HSUSB device nodes dt-bindings: dmaengine: usb-dmac: Add binding for r8a774c0 
dt-bindings: usb: renesas_usbhs: Add r8a774c0 support dt-bindings: usb: renesas_usbhs: add clock-names property Revert "usb: renesas_usbhs: add extcon notifier to set mode for non-otg channel" usb: renesas_usbhs: Add multiple clocks management usb: renesas_usbhs: Add reset_control usb: renesas_usbhs: add support for RZ/G2E arm64: dts: renesas: r8a774c0: Add USB2.0 phy and host device nodes dt-bindings: rcar-gen3-phy-usb2: Add r8a774c0 support dt-bindings: rcar-gen3-phy-usb2: Add r8a774a1 support arm64: renesas: Enable GPIOLIB to allow GPIO driver selection arm64: enable CMT/TMU support for Renesas SoC clocksource/drivers/sh_tmu: Convert to SPDX identifiers arm64: dts: renesas: r8a774c0: Add TMU device nodes dt-bindings: timer: renesas: tmu: Document r8a774c0 bindings clk: renesas: r8a774c0: Fix LAST_DT_CORE_CLK clk: renesas: r8a774c0: Add TMU clock clk: renesas: r8a774c0: Correct parent clock of DU clk: renesas: r8a774c0: Add missing CANFD clock arm64: dts: renesas: r8a774c0: Add CMT device nodes dt-bindings: timer: renesas, cmt: Document r8a774c0 CMT support dt-bindings: timer: renesas, cmt: Document r8a774a1 CMT support clocksource/drivers/sh_cmt: Add R-Car gen3 support dt-bindings: timer: renesas: cmt: document R-Car gen3 support clocksource/drivers/sh_cmt: Properly line-wrap sh_cmt_of_table[] initializer clocksource/drivers/sh_cmt: Fix clocksource width for 32-bit machines clocksource/drivers/sh_cmt: Fixup for 64-bit machines clocksource/drivers/sh_cmt: Convert to SPDX identifiers pinctrl: sh-pfc: r8a77990: Add DRIF pins, groups and functions pinctrl: sh-pfc: r8a77990: Add TMU pins, groups and functions pinctrl: sh-pfc: r8a77990: GP6_9 does not have pull-down capability pinctrl: sh-pfc: r8a77990: Fix MOD_SEL bit numbering pinctrl: sh-pfc: r8a77990: Fix MOD_SEL0 bit2 when using RX2, TX2 and SCK2 pinctrl: sh-pfc: r8a77990: Fix MOD_SEL0 bit3 when using TX0 pinctrl: sh-pfc: r8a77990: Fix MOD_SEL0 SEL_I2C1 field width pinctrl: sh-pfc: r8a77990: Fix IOCTRL reg state 
after s2ram on R-Car E3 pinctrl: sh-pfc: r8a77990: Add CAN FD pins, groups and functions pinctrl: sh-pfc: r8a77990: Add CAN pins, groups and functions arm64: dts: renesas: cat875: Enable PCIe support arm64: dts: renesas: r8a774c0-cat874: Add pciec0 support arm64: dts: renesas: r8a774c0: Add PCIe device node dt-bindings: PCI: rcar: Add device tree support for r8a774c0 arm64: dts: renesas: r8a774c0: Add MSIOF nodes spi: sh-msiof: Add r8a774c0 support spi: sh-msiof: Add r8a774a1 support arm64: dts: renesas: r8a774c0: Add I2C and IIC-DVFS support dt-bindings: i2c: rcar: Add r8a774c0 support i2c: sh_mobile: Add support for r8a774c0 (RZ/G2E) i2c: sh_mobile: add support for r8a77990 (R-Car E3) dt-bindings: i2c: sh_mobile: Add r8a774c0 support i2c: sh_mobile: document support for r8a77990 (R-Car E3) pinctrl: sh-pfc: r8a77990: Add HSCIF pins, groups, and functions pinctrl: sh-pfc: r8a77990: Add VIN[4|5] groups/functions pinctrl: sh-pfc: Add optional arg to VIN_DATA_PIN_GROUP pinctrl: sh-pfc: Reduce kernel size for narrow VIN channels arm64: dts: renesas: r8a774c0: Add watchdog support dt-bindings: watchdog: renesas-wdt: Document r8a774c0 support arm64: dts: renesas: cat875: Add ethernet support arm64: dts: renesas: r8a774c0: Add Ethernet AVB node dt-bindings: net: ravb: Add support for r8a774c0 SoC arm64: dts: renesas: r8a774c0-cat874: Add uSD support arm64: dts: renesas: r8a774c0: Add SDHI nodes mmc: renesas_sdhi_internal_dmac: Whitelist r8a774c0 dt-bindings: mmc: renesas_sdhi: Add r8a774c0 support dt-bindings: mmc: renesas_sdhi: Add r8a77470 support mmc: renesas_sdhi_internal_dmac: Whitelist r8a774a1 mmc: renesas_sdhi: Add r8a774a1 support pinctrl: sh-pfc: r8a77990: Add voltage switch operations for SDHI pinctrl: sh-pfc: r8a77990: Add SDHI pins, groups and functions pinctrl: sh-pfc: r8a77990: Add Audio SSI pins, groups and functions pinctrl: sh-pfc: r8a77990: Add Audio clock pins, groups and functions arm64: dts: renesas: r8a774c0-cat874: Add pincontrol support to scif2 
arm64: dts: renesas: r8a774c0: Add GPIO device nodes dt-bindings: gpio: rcar: Add r8a774c0 (RZ/G2E) support dt-bindings: gpio: rcar: Add r8a774a1 (RZ/G2M) support arm64: dts: renesas: r8a774c0: Add PFC support arm64: dts: renesas: r8a774c0: Add INTC-EX device node pinctrl: sh-pfc: r8a77990: Add INTC-EX pins, groups and function pinctrl: sh-pfc: rcar: Rename automotive-only arrays to automotive arm64: dts: renesas: r8a774c0: Add secondary CA53 CPU core clk: renesas: cpg-mssr: Add r8a774c0 support dt-bindings: clock: renesas: cpg-mssr: Document r8a774c0 clk: renesas: cpg-mssr: Add r8a774a1 support clk: renesas: rcar-gen3: Add support for mode pin clock selection clk: renesas: rcar-gen3: Add support for RCKSEL clock selection clk: renesas: cpg-mssr: Add support for fixed rate clocks clk: renesas: rcar-gen3: Add support for OSC EXTAL predivider clk: renesas: Add r8a774a1 CPG Core Clock Definitions clk: renesas: Add r8a774c0 CPG Core Clock Definitions arm64: dts: renesas: r8a774c0: Add SCIF and HSCIF nodes dt-bindings: serial: sh-sci: Document r8a774c0 bindings dt-bindings: serial: sh-sci: Document r8a774a1 bindings arm64: dts: renesas: r8a774c0: Add SYS-DMAC controller nodes dmaengine: rcar-dmac: Document R8A774C0 bindings dmaengine: rcar-dmac: Document R8A774A1 bindings arm64: dts: renesas: Add Si-Linux EK874 board support arm64: dts: renesas: Add Si-Linux CAT874 board support arm64: dts: renesas: Initial device tree for r8a774c0 dt-bindings: arm: Add si-linux cat87[45] boards ARM: dts: socfpga: Rename socfpga_cyclone5_de0_{sockit, nano_soc} dt-bindings: irqchip: renesas-irqc: Document r8a774c0 support soc: renesas: rcar-rst: Add support for RZ/G2E dt-bindings: reset: rcar-rst: Document r8a774c0 rst soc: renesas: rcar-rst: Add support for RZ/G2M soc: renesas: rcar-sysc: Add r8a774c0 support dt-bindings: power: rcar-sysc: Document r8a774c0 sysc soc: renesas: rcar-sysc: Add r8a774a1 support dt-bindings: power: Add r8a774c0 SYSC power domain definitions dt-bindings: 
power: Add r8a774a1 SYSC power domain definitions arm64: defconfig: enable R8A774C0 SoC arm64: defconfig: enable R8A774A1 SoC arm64: Add Renesas R8A774C0 support arm64: Add Renesas R8A774A1 support soc: renesas: Identify RZ/G2E soc: renesas: Identify RZ/G2M dt-bindings: arm: Fix RZ/G2E part number dt-bindings: arm: Document RZ/G2E SoC DT bindings dt-bindings: arm: Document RZ/G2M SoC DT bindings pinctrl: sh-pfc: r8a77990: Add R8A774C0 PFC support pinctrl: sh-pfc: r8a77990: Add MSIOF pins, groups and functions pinctrl: sh-pfc: r8a77990: Add DU pins, groups and function pinctrl: sh-pfc: r8a77990: Add PWM pins, groups and functions dt-bindings: pinctrl: sh-pfc: Document r8a774c0 PFC support pinctrl: sh-pfc: r8a7796: Add R8A774A1 PFC support dt-bindings: pinctrl: sh-pfc: Document r8a774a1 PFC support CIP: Add a number to the version suffix Conflicts: Documentation/devicetree/bindings/i2c/i2c-rcar.txt Documentation/devicetree/bindings/i2c/i2c-sh_mobile.txt Documentation/devicetree/bindings/usb/renesas_usb3.txt Documentation/devicetree/bindings/usb/renesas_usbhs.txt Documentation/devicetree/bindings/watchdog/renesas-wdt.txt arch/arm64/boot/dts/vendor/bindings/display/panel/advantech,idk-1110wr.txt arch/arm64/boot/dts/vendor/bindings/display/panel/advantech,idk-2121wr.yaml arch/arm64/boot/dts/vendor/bindings/i2c/i2c-rcar.txt arch/arm64/boot/dts/vendor/bindings/i2c/i2c-sh_mobile.txt arch/arm64/boot/dts/vendor/bindings/i2c/renesas,i2c.txt arch/arm64/boot/dts/vendor/bindings/i2c/renesas,iic.txt arch/arm64/boot/dts/vendor/bindings/media/i2c/imx219.yaml arch/arm64/boot/dts/vendor/bindings/memory-controllers/renesas,rpc-if.yaml arch/arm64/boot/dts/vendor/bindings/pci/rcar-pci-ep.yaml arch/arm64/boot/dts/vendor/bindings/usb/renesas,usb3-peri.txt arch/arm64/boot/dts/vendor/bindings/usb/renesas,usbhs.txt arch/arm64/boot/dts/vendor/bindings/usb/renesas_usb3.txt arch/arm64/boot/dts/vendor/bindings/usb/renesas_usbhs.txt arch/arm64/boot/dts/vendor/bindings/usb/ti,hd3ss3220.txt 
arch/arm64/boot/dts/vendor/bindings/watchdog/renesas,wdt.txt arch/arm64/boot/dts/vendor/bindings/watchdog/renesas-wdt.txt drivers/clk/qcom/clk-alpha-pll.c drivers/hid/hid-ids.h drivers/irqchip/irq-gic-v3.c drivers/media/platform/qcom/venus/hfi_parser.c drivers/mmc/host/sdhci.h drivers/platform/x86/intel_cht_int33fe.c drivers/slimbus/messaging.c drivers/usb/dwc3/core.c drivers/usb/dwc3/gadget.c drivers/usb/gadget/function/f_fs.c drivers/usb/typec/mux.c fs/ext4/dir.c kernel/time/posix-timers.c mm/oom_kill.c Change-Id: I6ccf7ce22c6636030db6245952c67bfa54aef5a4
2855 lines
86 KiB
C
2855 lines
86 KiB
C
/*
|
|
* mm/page-writeback.c
|
|
*
|
|
* Copyright (C) 2002, Linus Torvalds.
|
|
* Copyright (C) 2007 Red Hat, Inc., Peter Zijlstra
|
|
*
|
|
* Contains functions related to writing back dirty pages at the
|
|
* address_space level.
|
|
*
|
|
* 10Apr2002 Andrew Morton
|
|
* Initial version
|
|
*/
|
|
|
|
#include <linux/kernel.h>
|
|
#include <linux/export.h>
|
|
#include <linux/spinlock.h>
|
|
#include <linux/fs.h>
|
|
#include <linux/mm.h>
|
|
#include <linux/swap.h>
|
|
#include <linux/slab.h>
|
|
#include <linux/pagemap.h>
|
|
#include <linux/writeback.h>
|
|
#include <linux/init.h>
|
|
#include <linux/backing-dev.h>
|
|
#include <linux/task_io_accounting_ops.h>
|
|
#include <linux/blkdev.h>
|
|
#include <linux/mpage.h>
|
|
#include <linux/rmap.h>
|
|
#include <linux/percpu.h>
|
|
#include <linux/smp.h>
|
|
#include <linux/sysctl.h>
|
|
#include <linux/cpu.h>
|
|
#include <linux/syscalls.h>
|
|
#include <linux/buffer_head.h> /* __set_page_dirty_buffers */
|
|
#include <linux/pagevec.h>
|
|
#include <linux/timer.h>
|
|
#include <linux/sched/rt.h>
|
|
#include <linux/sched/signal.h>
|
|
#include <linux/mm_inline.h>
|
|
#include <trace/events/writeback.h>
|
|
|
|
#include "internal.h"
|
|
|
|
/*
|
|
* Sleep at most 200ms at a time in balance_dirty_pages().
|
|
*/
|
|
#define MAX_PAUSE max(HZ/5, 1)
|
|
|
|
/*
|
|
* Try to keep balance_dirty_pages() call intervals higher than this many pages
|
|
* by raising the pause time to max_pause when the interval falls below it.
|
|
*/
|
|
#define DIRTY_POLL_THRESH (128 >> (PAGE_SHIFT - 10))
|
|
|
|
/*
|
|
* Estimate write bandwidth at 200ms intervals.
|
|
*/
|
|
#define BANDWIDTH_INTERVAL max(HZ/5, 1)
|
|
|
|
/*
 * NOTE(review): no user of this macro is visible in this part of the file;
 * presumably a fixed-point shift used when computing dirty rate limits --
 * confirm against its users further down.
 */
#define RATELIMIT_CALC_SHIFT 10
|
|
|
|
/*
|
|
* After a CPU has dirtied this many pages, balance_dirty_pages_ratelimited
|
|
* will look to see if it needs to force writeback or throttling.
|
|
*/
|
|
static long ratelimit_pages = 32;
|
|
|
|
/* The following parameters are exported via /proc/sys/vm */
|
|
|
|
/*
|
|
* Start background writeback (via writeback threads) at this percentage
|
|
*/
|
|
int dirty_background_ratio = 10;
|
|
|
|
/*
|
|
* dirty_background_bytes starts at 0 (disabled) so that it is a function of
|
|
* dirty_background_ratio * the amount of dirtyable memory
|
|
*/
|
|
unsigned long dirty_background_bytes;
|
|
|
|
/*
|
|
* free highmem will not be subtracted from the total free memory
|
|
* for calculating free ratios if vm_highmem_is_dirtyable is true
|
|
*/
|
|
int vm_highmem_is_dirtyable;
|
|
|
|
/*
|
|
* The generator of dirty data starts writeback at this percentage
|
|
*/
|
|
int vm_dirty_ratio = 20;
|
|
|
|
/*
|
|
* vm_dirty_bytes starts at 0 (disabled) so that it is a function of
|
|
* vm_dirty_ratio * the amount of dirtyable memory
|
|
*/
|
|
unsigned long vm_dirty_bytes;
|
|
|
|
/*
|
|
* The interval between `kupdate'-style writebacks
|
|
*/
|
|
unsigned int dirty_writeback_interval = 5 * 100; /* centiseconds */
|
|
|
|
EXPORT_SYMBOL_GPL(dirty_writeback_interval);
|
|
|
|
/*
|
|
* The longest time for which data is allowed to remain dirty
|
|
*/
|
|
unsigned int dirty_expire_interval = 30 * 100; /* centiseconds */
|
|
|
|
/*
|
|
* Flag that makes the machine dump writes/reads and block dirtyings.
|
|
*/
|
|
int block_dump;
|
|
|
|
/*
|
|
* Flag that puts the machine in "laptop mode". Doubles as a timeout in jiffies:
|
|
* a full sync is triggered after this time elapses without any disk activity.
|
|
*/
|
|
int laptop_mode;
|
|
|
|
EXPORT_SYMBOL(laptop_mode);
|
|
|
|
/* End of sysctl-exported parameters */
|
|
|
|
/*
 * The system-wide writeback domain.  GDTC_INIT() and GDTC_INIT_NO_WB() point
 * dirty_throttle_control.dom at it when CONFIG_CGROUP_WRITEBACK is enabled,
 * and dtc_dom() returns it unconditionally when that option is disabled.
 */
struct wb_domain global_wb_domain;
|
|
|
|
/* consolidated parameters for balance_dirty_pages() and its subroutines */
|
|
/*
 * Bundle of the values balance_dirty_pages() and its helpers work on, so
 * they can be handed around as a single argument.
 */
struct dirty_throttle_control {
#ifdef CONFIG_CGROUP_WRITEBACK
	/* writeback domain this control block is accounted against */
	struct wb_domain	*dom;
	/* matching global dtc; populated for memcg dtc's only */
	struct dirty_throttle_control *gdtc;
#endif
	/* the bdi_writeback being throttled */
	struct bdi_writeback	*wb;
	/* completion counter of @wb to use (see GDTC_INIT / MDTC_INIT) */
	struct fprop_local_percpu *wb_completions;

	/* domain-wide figures */
	unsigned long		avail;		/* dirtyable memory */
	unsigned long		dirty;		/* file_dirty + write + nfs */
	unsigned long		thresh;		/* dirty threshold */
	unsigned long		bg_thresh;	/* background dirty threshold */

	/* the same figures, restricted to @wb */
	unsigned long		wb_dirty;
	unsigned long		wb_thresh;
	unsigned long		wb_bg_thresh;

	unsigned long		pos_ratio;
};
|
|
|
|
/*
|
|
* Length of period for aging writeout fractions of bdis. This is an
|
|
* arbitrarily chosen number. The longer the period, the more slowly the fractions will
|
|
* reflect changes in current writeout rate.
|
|
*/
|
|
#define VM_COMPLETIONS_PERIOD_LEN (3*HZ)
|
|
|
|
#ifdef CONFIG_CGROUP_WRITEBACK
|
|
|
|
/* Initializer fragment: dtc in the global domain, bound to @__wb. */
#define GDTC_INIT(__wb)							\
	.dom = &global_wb_domain,					\
	.wb = (__wb),							\
	.wb_completions = &(__wb)->completions

/* Initializer fragment: dtc in the global domain without a wb. */
#define GDTC_INIT_NO_WB							\
	.dom = &global_wb_domain

/*
 * Initializer fragment: dtc in @__wb's memcg domain, linked to the global
 * dtc @__gdtc.
 */
#define MDTC_INIT(__wb, __gdtc)						\
	.dom = mem_cgroup_wb_domain(__wb),				\
	.gdtc = __gdtc,							\
	.wb = (__wb),							\
	.wb_completions = &(__wb)->memcg_completions
|
|
|
|
static bool mdtc_valid(struct dirty_throttle_control *dtc)
|
|
{
|
|
return dtc->dom;
|
|
}
|
|
|
|
static struct wb_domain *dtc_dom(struct dirty_throttle_control *dtc)
|
|
{
|
|
return dtc->dom;
|
|
}
|
|
|
|
static struct dirty_throttle_control *mdtc_gdtc(struct dirty_throttle_control *mdtc)
|
|
{
|
|
return mdtc->gdtc;
|
|
}
|
|
|
|
static struct fprop_local_percpu *wb_memcg_completions(struct bdi_writeback *wb)
|
|
{
|
|
return &wb->memcg_completions;
|
|
}
|
|
|
|
static void wb_min_max_ratio(struct bdi_writeback *wb,
|
|
unsigned long *minp, unsigned long *maxp)
|
|
{
|
|
unsigned long this_bw = wb->avg_write_bandwidth;
|
|
unsigned long tot_bw = atomic_long_read(&wb->bdi->tot_write_bandwidth);
|
|
unsigned long long min = wb->bdi->min_ratio;
|
|
unsigned long long max = wb->bdi->max_ratio;
|
|
|
|
/*
|
|
* @wb may already be clean by the time control reaches here and
|
|
* the total may not include its bw.
|
|
*/
|
|
if (this_bw < tot_bw) {
|
|
if (min) {
|
|
min *= this_bw;
|
|
min = div64_ul(min, tot_bw);
|
|
}
|
|
if (max < 100) {
|
|
max *= this_bw;
|
|
max = div64_ul(max, tot_bw);
|
|
}
|
|
}
|
|
|
|
*minp = min;
|
|
*maxp = max;
|
|
}
|
|
|
|
#else /* CONFIG_CGROUP_WRITEBACK */
|
|
|
|
/* Initializer fragment: dtc bound to @__wb (no domains without cgroup wb). */
#define GDTC_INIT(__wb)							\
	.wb = (__wb),							\
	.wb_completions = &(__wb)->completions
/* Nothing to initialize when there is no wb and no domain pointer. */
#define GDTC_INIT_NO_WB
/* Memcg dtc's have no fields to set without cgroup writeback. */
#define MDTC_INIT(__wb, __gdtc)
|
|
|
|
/* Without cgroup writeback a memcg dtc is never valid. */
static bool mdtc_valid(struct dirty_throttle_control *dtc)
{
	/* @dtc is intentionally not inspected */
	return false;
}
|
|
|
|
static struct wb_domain *dtc_dom(struct dirty_throttle_control *dtc)
|
|
{
|
|
return &global_wb_domain;
|
|
}
|
|
|
|
/* Without cgroup writeback there is no linked global dtc. */
static struct dirty_throttle_control *mdtc_gdtc(struct dirty_throttle_control *mdtc)
{
	/* @mdtc is intentionally not inspected */
	return NULL;
}
|
|
|
|
/* Without cgroup writeback a wb has no memcg completion counter. */
static struct fprop_local_percpu *wb_memcg_completions(struct bdi_writeback *wb)
{
	/* @wb is intentionally not inspected */
	return NULL;
}
|
|
|
|
static void wb_min_max_ratio(struct bdi_writeback *wb,
|
|
unsigned long *minp, unsigned long *maxp)
|
|
{
|
|
*minp = wb->bdi->min_ratio;
|
|
*maxp = wb->bdi->max_ratio;
|
|
}
|
|
|
|
#endif /* CONFIG_CGROUP_WRITEBACK */
|
|
|
|
/*
|
|
* In a memory zone, there is a certain amount of pages we consider
|
|
* available for the page cache, which is essentially the number of
|
|
* free and reclaimable pages, minus some zone reserves to protect
|
|
* lowmem and the ability to uphold the zone's watermarks without
|
|
* requiring writeback.
|
|
*
|
|
* This number of dirtyable pages is the base value of which the
|
|
 * user-configurable dirty ratio is the effective number of pages that
|
|
* are allowed to be actually dirtied. Per individual zone, or
|
|
* globally by using the sum of dirtyable pages over all zones.
|
|
*
|
|
* Because the user is allowed to specify the dirty limit globally as
|
|
* absolute number of bytes, calculating the per-zone dirty limit can
|
|
* require translating the configured limit into a percentage of
|
|
* global dirtyable memory first.
|
|
*/
|
|
|
|
/**
|
|
* node_dirtyable_memory - number of dirtyable pages in a node
|
|
* @pgdat: the node
|
|
*
|
|
* Returns the node's number of pages potentially available for dirty
|
|
* page cache. This is the base value for the per-node dirty limits.
|
|
*/
|
|
static unsigned long node_dirtyable_memory(struct pglist_data *pgdat)
|
|
{
|
|
unsigned long nr_pages = 0;
|
|
int z;
|
|
|
|
for (z = 0; z < MAX_NR_ZONES; z++) {
|
|
struct zone *zone = pgdat->node_zones + z;
|
|
|
|
if (!populated_zone(zone))
|
|
continue;
|
|
|
|
nr_pages += zone_page_state(zone, NR_FREE_PAGES);
|
|
}
|
|
|
|
/*
|
|
* Pages reserved for the kernel should not be considered
|
|
* dirtyable, to prevent a situation where reclaim has to
|
|
* clean pages in order to balance the zones.
|
|
*/
|
|
nr_pages -= min(nr_pages, pgdat->totalreserve_pages);
|
|
|
|
nr_pages += node_page_state(pgdat, NR_INACTIVE_FILE);
|
|
nr_pages += node_page_state(pgdat, NR_ACTIVE_FILE);
|
|
|
|
return nr_pages;
|
|
}
|
|
|
|
/*
 * Number of dirtyable pages that live in highmem zones, capped at @total.
 * Always 0 when the kernel is built without CONFIG_HIGHMEM.
 */
static unsigned long highmem_dirtyable_memory(unsigned long total)
{
#ifdef CONFIG_HIGHMEM
	unsigned long sum = 0;
	int nid;
	int zidx;

	for_each_node_state(nid, N_HIGH_MEMORY) {
		for (zidx = ZONE_NORMAL + 1; zidx < MAX_NR_ZONES; zidx++) {
			struct zone *zone;
			unsigned long free_pages;
			unsigned long usable;

			if (!is_highmem_idx(zidx))
				continue;

			zone = &NODE_DATA(nid)->node_zones[zidx];
			if (!populated_zone(zone))
				continue;

			free_pages = zone_page_state(zone, NR_FREE_PAGES);
			/* clamp so that the subtraction cannot underflow */
			usable = free_pages -
				 min(free_pages, high_wmark_pages(zone));
			usable += zone_page_state(zone, NR_ZONE_INACTIVE_FILE);
			usable += zone_page_state(zone, NR_ZONE_ACTIVE_FILE);
			sum += usable;
		}
	}

	/*
	 * Unreclaimable memory (kernel memory, or anonymous memory without
	 * swap) can push the dirtyable pages below the zone's dirty balance
	 * reserve and make the calculation above underflow.  Nodes below
	 * the threshold (negative values) are still added in for accuracy,
	 * but the total itself must never end up negative.
	 */
	if ((long)sum < 0)
		sum = 0;

	/*
	 * Never report more highmem pages than total dirtyable memory.
	 * That should only happen in very strange VM situations, but guard
	 * against it anyway.
	 */
	return min(sum, total);
#else
	return 0;
#endif
}
|
|
|
|
/**
|
|
* global_dirtyable_memory - number of globally dirtyable pages
|
|
*
|
|
* Returns the global number of pages potentially available for dirty
|
|
* page cache. This is the base value for the global dirty limits.
|
|
*/
|
|
static unsigned long global_dirtyable_memory(void)
|
|
{
|
|
unsigned long x;
|
|
|
|
x = global_zone_page_state(NR_FREE_PAGES);
|
|
/*
|
|
* Pages reserved for the kernel should not be considered
|
|
* dirtyable, to prevent a situation where reclaim has to
|
|
* clean pages in order to balance the zones.
|
|
*/
|
|
x -= min(x, totalreserve_pages);
|
|
|
|
x += global_node_page_state(NR_INACTIVE_FILE);
|
|
x += global_node_page_state(NR_ACTIVE_FILE);
|
|
|
|
if (!vm_highmem_is_dirtyable)
|
|
x -= highmem_dirtyable_memory(x);
|
|
|
|
return x + 1; /* Ensure that we never return 0 */
|
|
}
|
|
|
|
/**
|
|
* domain_dirty_limits - calculate thresh and bg_thresh for a wb_domain
|
|
* @dtc: dirty_throttle_control of interest
|
|
*
|
|
* Calculate @dtc->thresh and ->bg_thresh considering
|
|
* vm_dirty_{bytes|ratio} and dirty_background_{bytes|ratio}. The caller
|
|
* must ensure that @dtc->avail is set before calling this function. The
|
|
* dirty limits will be lifted by 1/4 for PF_LESS_THROTTLE (ie. nfsd) and
|
|
* real-time tasks.
|
|
*/
|
|
static void domain_dirty_limits(struct dirty_throttle_control *dtc)
|
|
{
|
|
const unsigned long available_memory = dtc->avail;
|
|
struct dirty_throttle_control *gdtc = mdtc_gdtc(dtc);
|
|
unsigned long bytes = vm_dirty_bytes;
|
|
unsigned long bg_bytes = dirty_background_bytes;
|
|
/* convert ratios to per-PAGE_SIZE for higher precision */
|
|
unsigned long ratio = (vm_dirty_ratio * PAGE_SIZE) / 100;
|
|
unsigned long bg_ratio = (dirty_background_ratio * PAGE_SIZE) / 100;
|
|
unsigned long thresh;
|
|
unsigned long bg_thresh;
|
|
struct task_struct *tsk;
|
|
|
|
/* gdtc is !NULL iff @dtc is for memcg domain */
|
|
if (gdtc) {
|
|
unsigned long global_avail = gdtc->avail;
|
|
|
|
/*
|
|
* The byte settings can't be applied directly to memcg
|
|
* domains. Convert them to ratios by scaling against
|
|
* globally available memory. As the ratios are in
|
|
* per-PAGE_SIZE, they can be obtained by dividing bytes by
|
|
* number of pages.
|
|
*/
|
|
if (bytes)
|
|
ratio = min(DIV_ROUND_UP(bytes, global_avail),
|
|
PAGE_SIZE);
|
|
if (bg_bytes)
|
|
bg_ratio = min(DIV_ROUND_UP(bg_bytes, global_avail),
|
|
PAGE_SIZE);
|
|
bytes = bg_bytes = 0;
|
|
}
|
|
|
|
if (bytes)
|
|
thresh = DIV_ROUND_UP(bytes, PAGE_SIZE);
|
|
else
|
|
thresh = (ratio * available_memory) / PAGE_SIZE;
|
|
|
|
if (bg_bytes)
|
|
bg_thresh = DIV_ROUND_UP(bg_bytes, PAGE_SIZE);
|
|
else
|
|
bg_thresh = (bg_ratio * available_memory) / PAGE_SIZE;
|
|
|
|
tsk = current;
|
|
if (tsk->flags & PF_LESS_THROTTLE || rt_task(tsk)) {
|
|
bg_thresh += bg_thresh / 4 + global_wb_domain.dirty_limit / 32;
|
|
thresh += thresh / 4 + global_wb_domain.dirty_limit / 32;
|
|
}
|
|
/*
|
|
* Dirty throttling logic assumes the limits in page units fit into
|
|
* 32-bits. This gives 16TB dirty limits max which is hopefully enough.
|
|
*/
|
|
if (thresh > UINT_MAX)
|
|
thresh = UINT_MAX;
|
|
/* This makes sure bg_thresh is within 32-bits as well */
|
|
if (bg_thresh >= thresh)
|
|
bg_thresh = thresh / 2;
|
|
dtc->thresh = thresh;
|
|
dtc->bg_thresh = bg_thresh;
|
|
|
|
/* we should eventually report the domain in the TP */
|
|
if (!gdtc)
|
|
trace_global_dirty_state(bg_thresh, thresh);
|
|
}
|
|
|
|
/**
|
|
* global_dirty_limits - background-writeback and dirty-throttling thresholds
|
|
* @pbackground: out parameter for bg_thresh
|
|
* @pdirty: out parameter for thresh
|
|
*
|
|
* Calculate bg_thresh and thresh for global_wb_domain. See
|
|
* domain_dirty_limits() for details.
|
|
*/
|
|
void global_dirty_limits(unsigned long *pbackground, unsigned long *pdirty)
|
|
{
|
|
struct dirty_throttle_control gdtc = { GDTC_INIT_NO_WB };
|
|
|
|
gdtc.avail = global_dirtyable_memory();
|
|
domain_dirty_limits(&gdtc);
|
|
|
|
*pbackground = gdtc.bg_thresh;
|
|
*pdirty = gdtc.thresh;
|
|
}
|
|
|
|
/**
|
|
* node_dirty_limit - maximum number of dirty pages allowed in a node
|
|
* @pgdat: the node
|
|
*
|
|
* Returns the maximum number of dirty pages allowed in a node, based
|
|
* on the node's dirtyable memory.
|
|
*/
|
|
static unsigned long node_dirty_limit(struct pglist_data *pgdat)
|
|
{
|
|
unsigned long node_memory = node_dirtyable_memory(pgdat);
|
|
struct task_struct *tsk = current;
|
|
unsigned long dirty;
|
|
|
|
if (vm_dirty_bytes)
|
|
dirty = DIV_ROUND_UP(vm_dirty_bytes, PAGE_SIZE) *
|
|
node_memory / global_dirtyable_memory();
|
|
else
|
|
dirty = vm_dirty_ratio * node_memory / 100;
|
|
|
|
if (tsk->flags & PF_LESS_THROTTLE || rt_task(tsk))
|
|
dirty += dirty / 4;
|
|
|
|
/*
|
|
* Dirty throttling logic assumes the limits in page units fit into
|
|
* 32-bits. This gives 16TB dirty limits max which is hopefully enough.
|
|
*/
|
|
return min_t(unsigned long, dirty, UINT_MAX);
|
|
}
|
|
|
|
/**
|
|
* node_dirty_ok - tells whether a node is within its dirty limits
|
|
* @pgdat: the node to check
|
|
*
|
|
* Returns %true when the dirty pages in @pgdat are within the node's
|
|
* dirty limit, %false if the limit is exceeded.
|
|
*/
|
|
bool node_dirty_ok(struct pglist_data *pgdat)
|
|
{
|
|
unsigned long limit = node_dirty_limit(pgdat);
|
|
unsigned long nr_pages = 0;
|
|
|
|
nr_pages += node_page_state(pgdat, NR_FILE_DIRTY);
|
|
nr_pages += node_page_state(pgdat, NR_UNSTABLE_NFS);
|
|
nr_pages += node_page_state(pgdat, NR_WRITEBACK);
|
|
|
|
return nr_pages <= limit;
|
|
}
|
|
|
|
/*
 * sysctl handler for the background dirty ratio.  A successful write
 * resets dirty_background_bytes to 0.
 */
int dirty_background_ratio_handler(struct ctl_table *table, int write,
		void *buffer, size_t *lenp, loff_t *ppos)
{
	int err = proc_dointvec_minmax(table, write, buffer, lenp, ppos);

	if (err || !write)
		return err;

	dirty_background_bytes = 0;
	return 0;
}
|
|
|
|
/*
 * sysctl handler for the background dirty byte limit.  A successful write
 * resets dirty_background_ratio to 0.  A value whose page count does not
 * fit into 32 bits is rejected with -ERANGE and the old value is restored.
 */
int dirty_background_bytes_handler(struct ctl_table *table, int write,
		void *buffer, size_t *lenp, loff_t *ppos)
{
	unsigned long saved = dirty_background_bytes;
	int err;

	err = proc_doulongvec_minmax(table, write, buffer, lenp, ppos);
	if (err != 0 || !write)
		return err;

	if (DIV_ROUND_UP(dirty_background_bytes, PAGE_SIZE) > UINT_MAX) {
		dirty_background_bytes = saved;
		return -ERANGE;
	}

	dirty_background_ratio = 0;
	return 0;
}
|
|
|
|
int dirty_ratio_handler(struct ctl_table *table, int write, void *buffer,
|
|
size_t *lenp, loff_t *ppos)
|
|
{
|
|
int old_ratio = vm_dirty_ratio;
|
|
int ret;
|
|
|
|
ret = proc_dointvec_minmax(table, write, buffer, lenp, ppos);
|
|
if (ret == 0 && write && vm_dirty_ratio != old_ratio) {
|
|
vm_dirty_bytes = 0;
|
|
writeback_set_ratelimit();
|
|
}
|
|
return ret;
|
|
}
|
|
|
|
/*
 * sysctl handler for vm_dirty_bytes.  When a write actually changes the
 * value, the ratelimit is recomputed and vm_dirty_ratio is reset to 0.
 * A value whose page count does not fit into 32 bits is rejected with
 * -ERANGE and the old value is restored.
 */
int dirty_bytes_handler(struct ctl_table *table, int write,
		void *buffer, size_t *lenp, loff_t *ppos)
{
	unsigned long saved = vm_dirty_bytes;
	int err;

	err = proc_doulongvec_minmax(table, write, buffer, lenp, ppos);
	if (err != 0 || !write)
		return err;

	/* nothing to do if the value did not change */
	if (vm_dirty_bytes == saved)
		return 0;

	if (DIV_ROUND_UP(vm_dirty_bytes, PAGE_SIZE) > UINT_MAX) {
		vm_dirty_bytes = saved;
		return -ERANGE;
	}

	writeback_set_ratelimit();
	vm_dirty_ratio = 0;
	return 0;
}
|
|
|
|
static unsigned long wp_next_time(unsigned long cur_time)
|
|
{
|
|
cur_time += VM_COMPLETIONS_PERIOD_LEN;
|
|
/* 0 has a special meaning... */
|
|
if (!cur_time)
|
|
return 1;
|
|
return cur_time;
|
|
}
|
|
|
|
static void wb_domain_writeout_inc(struct wb_domain *dom,
|
|
struct fprop_local_percpu *completions,
|
|
unsigned int max_prop_frac)
|
|
{
|
|
__fprop_inc_percpu_max(&dom->completions, completions,
|
|
max_prop_frac);
|
|
/* First event after period switching was turned off? */
|
|
if (unlikely(!dom->period_time)) {
|
|
/*
|
|
* We can race with other __bdi_writeout_inc calls here but
|
|
* it does not cause any harm since the resulting time when
|
|
* timer will fire and what is in writeout_period_time will be
|
|
* roughly the same.
|
|
*/
|
|
dom->period_time = wp_next_time(jiffies);
|
|
mod_timer(&dom->period_timer, dom->period_time);
|
|
}
|
|
}
|
|
|
|
/*
|
|
* Increment @wb's writeout completion count and the global writeout
|
|
* completion count. Called from test_clear_page_writeback().
|
|
*/
|
|
static inline void __wb_writeout_inc(struct bdi_writeback *wb)
|
|
{
|
|
struct wb_domain *cgdom;
|
|
|
|
inc_wb_stat(wb, WB_WRITTEN);
|
|
wb_domain_writeout_inc(&global_wb_domain, &wb->completions,
|
|
wb->bdi->max_prop_frac);
|
|
|
|
cgdom = mem_cgroup_wb_domain(wb);
|
|
if (cgdom)
|
|
wb_domain_writeout_inc(cgdom, wb_memcg_completions(wb),
|
|
wb->bdi->max_prop_frac);
|
|
}
|
|
|
|
/* Exported wrapper: run __wb_writeout_inc() with local interrupts off. */
void wb_writeout_inc(struct bdi_writeback *wb)
{
	unsigned long irq_flags;

	local_irq_save(irq_flags);
	__wb_writeout_inc(wb);
	local_irq_restore(irq_flags);
}
EXPORT_SYMBOL_GPL(wb_writeout_inc);
|
|
|
|
/*
|
|
* On idle system, we can be called long after we scheduled because we use
|
|
* deferred timers so count with missed periods.
|
|
*/
|
|
static void writeout_period(struct timer_list *t)
|
|
{
|
|
struct wb_domain *dom = from_timer(dom, t, period_timer);
|
|
int miss_periods = (jiffies - dom->period_time) /
|
|
VM_COMPLETIONS_PERIOD_LEN;
|
|
|
|
if (fprop_new_period(&dom->completions, miss_periods + 1)) {
|
|
dom->period_time = wp_next_time(dom->period_time +
|
|
miss_periods * VM_COMPLETIONS_PERIOD_LEN);
|
|
mod_timer(&dom->period_timer, dom->period_time);
|
|
} else {
|
|
/*
|
|
* Aging has zeroed all fractions. Stop wasting CPU on period
|
|
* updates.
|
|
*/
|
|
dom->period_time = 0;
|
|
}
|
|
}
|
|
|
|
/*
 * Initialize @dom: zero it, set up its lock and deferrable period timer,
 * stamp the dirty limit time and initialize the completion counters
 * using @gfp.  Returns the result of fprop_global_init().
 */
int wb_domain_init(struct wb_domain *dom, gfp_t gfp)
{
	int err;

	memset(dom, 0, sizeof(*dom));

	spin_lock_init(&dom->lock);

	/* writeout_period() ages the completion fractions */
	timer_setup(&dom->period_timer, writeout_period, TIMER_DEFERRABLE);

	dom->dirty_limit_tstamp = jiffies;

	err = fprop_global_init(&dom->completions, gfp);
	return err;
}
|
|
|
|
#ifdef CONFIG_CGROUP_WRITEBACK
|
|
void wb_domain_exit(struct wb_domain *dom)
|
|
{
|
|
del_timer_sync(&dom->period_timer);
|
|
fprop_global_destroy(&dom->completions);
|
|
}
|
|
#endif
|
|
|
|
/*
 * Sum of the minimum dirty shares of all registered backing devices.
 * For obvious reasons this total can not exceed 100%.
 */
static unsigned int bdi_min_ratio;
|
|
|
|
int bdi_set_min_ratio(struct backing_dev_info *bdi, unsigned int min_ratio)
|
|
{
|
|
int ret = 0;
|
|
|
|
spin_lock_bh(&bdi_lock);
|
|
if (min_ratio > bdi->max_ratio) {
|
|
ret = -EINVAL;
|
|
} else {
|
|
min_ratio -= bdi->min_ratio;
|
|
if (bdi_min_ratio + min_ratio < 100) {
|
|
bdi_min_ratio += min_ratio;
|
|
bdi->min_ratio += min_ratio;
|
|
} else {
|
|
ret = -EINVAL;
|
|
}
|
|
}
|
|
spin_unlock_bh(&bdi_lock);
|
|
|
|
return ret;
|
|
}
|
|
|
|
int bdi_set_max_ratio(struct backing_dev_info *bdi, unsigned max_ratio)
|
|
{
|
|
int ret = 0;
|
|
|
|
if (max_ratio > 100)
|
|
return -EINVAL;
|
|
|
|
spin_lock_bh(&bdi_lock);
|
|
if (bdi->min_ratio > max_ratio) {
|
|
ret = -EINVAL;
|
|
} else {
|
|
bdi->max_ratio = max_ratio;
|
|
bdi->max_prop_frac = (FPROP_FRAC_BASE * max_ratio) / 100;
|
|
}
|
|
spin_unlock_bh(&bdi_lock);
|
|
|
|
return ret;
|
|
}
|
|
EXPORT_SYMBOL(bdi_set_max_ratio);
|
|
|
|
/* Midpoint between the dirty threshold and the background threshold. */
static unsigned long dirty_freerun_ceiling(unsigned long thresh,
					   unsigned long bg_thresh)
{
	unsigned long sum = thresh + bg_thresh;

	return sum >> 1;
}
|
|
|
|
static unsigned long hard_dirty_limit(struct wb_domain *dom,
|
|
unsigned long thresh)
|
|
{
|
|
return max(thresh, dom->dirty_limit);
|
|
}
|
|
|
|
/*
|
|
* Memory which can be further allocated to a memcg domain is capped by
|
|
* system-wide clean memory excluding the amount being used in the domain.
|
|
*/
|
|
static void mdtc_calc_avail(struct dirty_throttle_control *mdtc,
|
|
unsigned long filepages, unsigned long headroom)
|
|
{
|
|
struct dirty_throttle_control *gdtc = mdtc_gdtc(mdtc);
|
|
unsigned long clean = filepages - min(filepages, mdtc->dirty);
|
|
unsigned long global_clean = gdtc->avail - min(gdtc->avail, gdtc->dirty);
|
|
unsigned long other_clean = global_clean - min(global_clean, clean);
|
|
|
|
mdtc->avail = filepages + min(headroom, other_clean);
|
|
}
|
|
|
|
/**
|
|
* __wb_calc_thresh - @wb's share of dirty throttling threshold
|
|
* @dtc: dirty_throttle_context of interest
|
|
*
|
|
* Returns @wb's dirty limit in pages. The term "dirty" in the context of
|
|
* dirty balancing includes all PG_dirty, PG_writeback and NFS unstable pages.
|
|
*
|
|
* Note that balance_dirty_pages() will only seriously take it as a hard limit
|
|
* when sleeping max_pause per page is not enough to keep the dirty pages under
|
|
* control. For example, when the device is completely stalled due to some error
|
|
* conditions, or when there are 1000 dd tasks writing to a slow 10MB/s USB key.
|
|
* In the other normal situations, it acts more gently by throttling the tasks
|
|
* more (rather than completely block them) when the wb dirty pages go high.
|
|
*
|
|
* It allocates high/low dirty limits to fast/slow devices, in order to prevent
|
|
* - starving fast devices
|
|
* - piling up dirty pages (that will take long time to sync) on slow devices
|
|
*
|
|
* The wb's share of dirty limit will be adapting to its throughput and
|
|
* bounded by the bdi->min_ratio and/or bdi->max_ratio parameters, if set.
|
|
*/
|
|
static unsigned long __wb_calc_thresh(struct dirty_throttle_control *dtc)
|
|
{
|
|
struct wb_domain *dom = dtc_dom(dtc);
|
|
unsigned long thresh = dtc->thresh;
|
|
u64 wb_thresh;
|
|
long numerator, denominator;
|
|
unsigned long wb_min_ratio, wb_max_ratio;
|
|
|
|
/*
|
|
* Calculate this BDI's share of the thresh ratio.
|
|
*/
|
|
fprop_fraction_percpu(&dom->completions, dtc->wb_completions,
|
|
&numerator, &denominator);
|
|
|
|
wb_thresh = (thresh * (100 - bdi_min_ratio)) / 100;
|
|
wb_thresh *= numerator;
|
|
do_div(wb_thresh, denominator);
|
|
|
|
wb_min_max_ratio(dtc->wb, &wb_min_ratio, &wb_max_ratio);
|
|
|
|
wb_thresh += (thresh * wb_min_ratio) / 100;
|
|
if (wb_thresh > (thresh * wb_max_ratio) / 100)
|
|
wb_thresh = thresh * wb_max_ratio / 100;
|
|
|
|
return wb_thresh;
|
|
}
|
|
|
|
unsigned long wb_calc_thresh(struct bdi_writeback *wb, unsigned long thresh)
|
|
{
|
|
struct dirty_throttle_control gdtc = { GDTC_INIT(wb),
|
|
.thresh = thresh };
|
|
return __wb_calc_thresh(&gdtc);
|
|
}
|
|
|
|
/*
|
|
* setpoint - dirty 3
|
|
* f(dirty) := 1.0 + (----------------)
|
|
* limit - setpoint
|
|
*
|
|
* it's a 3rd order polynomial that subjects to
|
|
*
|
|
* (1) f(freerun) = 2.0 => rampup dirty_ratelimit reasonably fast
|
|
* (2) f(setpoint) = 1.0 => the balance point
|
|
* (3) f(limit) = 0 => the hard limit
|
|
* (4) df/dx <= 0 => negative feedback control
|
|
* (5) the closer to setpoint, the smaller |df/dx| (and the reverse)
|
|
* => fast response on large errors; small oscillation near setpoint
|
|
*/
|
|
static long long pos_ratio_polynom(unsigned long setpoint,
|
|
unsigned long dirty,
|
|
unsigned long limit)
|
|
{
|
|
long long pos_ratio;
|
|
long x;
|
|
|
|
x = div64_s64(((s64)setpoint - (s64)dirty) << RATELIMIT_CALC_SHIFT,
|
|
(limit - setpoint) | 1);
|
|
pos_ratio = x;
|
|
pos_ratio = pos_ratio * x >> RATELIMIT_CALC_SHIFT;
|
|
pos_ratio = pos_ratio * x >> RATELIMIT_CALC_SHIFT;
|
|
pos_ratio += 1 << RATELIMIT_CALC_SHIFT;
|
|
|
|
return clamp(pos_ratio, 0LL, 2LL << RATELIMIT_CALC_SHIFT);
|
|
}
|
|
|
|
/*
|
|
* Dirty position control.
|
|
*
|
|
* (o) global/bdi setpoints
|
|
*
|
|
* We want the dirty pages be balanced around the global/wb setpoints.
|
|
* When the number of dirty pages is higher/lower than the setpoint, the
|
|
* dirty position control ratio (and hence task dirty ratelimit) will be
|
|
* decreased/increased to bring the dirty pages back to the setpoint.
|
|
*
|
|
* pos_ratio = 1 << RATELIMIT_CALC_SHIFT
|
|
*
|
|
* if (dirty < setpoint) scale up pos_ratio
|
|
* if (dirty > setpoint) scale down pos_ratio
|
|
*
|
|
* if (wb_dirty < wb_setpoint) scale up pos_ratio
|
|
* if (wb_dirty > wb_setpoint) scale down pos_ratio
|
|
*
|
|
* task_ratelimit = dirty_ratelimit * pos_ratio >> RATELIMIT_CALC_SHIFT
|
|
*
|
|
* (o) global control line
|
|
*
|
|
* ^ pos_ratio
|
|
* |
|
|
* | |<===== global dirty control scope ======>|
|
|
* 2.0 .............*
|
|
* | .*
|
|
* | . *
|
|
* | . *
|
|
* | . *
|
|
* | . *
|
|
* | . *
|
|
* 1.0 ................................*
|
|
* | . . *
|
|
* | . . *
|
|
* | . . *
|
|
* | . . *
|
|
* | . . *
|
|
* 0 +------------.------------------.----------------------*------------->
|
|
* freerun^ setpoint^ limit^ dirty pages
|
|
*
|
|
* (o) wb control line
|
|
*
|
|
* ^ pos_ratio
|
|
* |
|
|
* | *
|
|
* | *
|
|
* | *
|
|
* | *
|
|
* | * |<=========== span ============>|
|
|
* 1.0 .......................*
|
|
* | . *
|
|
* | . *
|
|
* | . *
|
|
* | . *
|
|
* | . *
|
|
* | . *
|
|
* | . *
|
|
* | . *
|
|
* | . *
|
|
* | . *
|
|
* | . *
|
|
* 1/4 ...............................................* * * * * * * * * * * *
|
|
* | . .
|
|
* | . .
|
|
* | . .
|
|
* 0 +----------------------.-------------------------------.------------->
|
|
* wb_setpoint^ x_intercept^
|
|
*
|
|
* The wb control line won't drop below pos_ratio=1/4, so that wb_dirty can
|
|
* be smoothly throttled down to normal if it starts high in situations like
|
|
* - start writing to a slow SD card and a fast disk at the same time. The SD
|
|
* card's wb_dirty may rush to many times higher than wb_setpoint.
|
|
* - the wb dirty thresh drops quickly due to change of JBOD workload
|
|
*/
|
|
static void wb_position_ratio(struct dirty_throttle_control *dtc)
|
|
{
|
|
struct bdi_writeback *wb = dtc->wb;
|
|
unsigned long write_bw = wb->avg_write_bandwidth;
|
|
unsigned long freerun = dirty_freerun_ceiling(dtc->thresh, dtc->bg_thresh);
|
|
unsigned long limit = hard_dirty_limit(dtc_dom(dtc), dtc->thresh);
|
|
unsigned long wb_thresh = dtc->wb_thresh;
|
|
unsigned long x_intercept;
|
|
unsigned long setpoint; /* dirty pages' target balance point */
|
|
unsigned long wb_setpoint;
|
|
unsigned long span;
|
|
long long pos_ratio; /* for scaling up/down the rate limit */
|
|
long x;
|
|
|
|
dtc->pos_ratio = 0;
|
|
|
|
if (unlikely(dtc->dirty >= limit))
|
|
return;
|
|
|
|
/*
|
|
* global setpoint
|
|
*
|
|
* See comment for pos_ratio_polynom().
|
|
*/
|
|
setpoint = (freerun + limit) / 2;
|
|
pos_ratio = pos_ratio_polynom(setpoint, dtc->dirty, limit);
|
|
|
|
/*
|
|
* The strictlimit feature is a tool preventing mistrusted filesystems
|
|
* from growing a large number of dirty pages before throttling. For
|
|
* such filesystems balance_dirty_pages always checks wb counters
|
|
* against wb limits. Even if global "nr_dirty" is under "freerun".
|
|
* This is especially important for fuse which sets bdi->max_ratio to
|
|
* 1% by default. Without strictlimit feature, fuse writeback may
|
|
* consume arbitrary amount of RAM because it is accounted in
|
|
* NR_WRITEBACK_TEMP which is not involved in calculating "nr_dirty".
|
|
*
|
|
* Here, in wb_position_ratio(), we calculate pos_ratio based on
|
|
* two values: wb_dirty and wb_thresh. Let's consider an example:
|
|
* total amount of RAM is 16GB, bdi->max_ratio is equal to 1%, global
|
|
* limits are set by default to 10% and 20% (background and throttle).
|
|
* Then wb_thresh is 1% of 20% of 16GB. This amounts to ~8K pages.
|
|
* wb_calc_thresh(wb, bg_thresh) is about ~4K pages. wb_setpoint is
|
|
* about ~6K pages (as the average of background and throttle wb
|
|
* limits). The 3rd order polynomial will provide positive feedback if
|
|
* wb_dirty is under wb_setpoint and vice versa.
|
|
*
|
|
* Note, that we cannot use global counters in these calculations
|
|
* because we want to throttle process writing to a strictlimit wb
|
|
* much earlier than global "freerun" is reached (~23MB vs. ~2.3GB
|
|
* in the example above).
|
|
*/
|
|
if (unlikely(wb->bdi->capabilities & BDI_CAP_STRICTLIMIT)) {
|
|
long long wb_pos_ratio;
|
|
|
|
if (dtc->wb_dirty < 8) {
|
|
dtc->pos_ratio = min_t(long long, pos_ratio * 2,
|
|
2 << RATELIMIT_CALC_SHIFT);
|
|
return;
|
|
}
|
|
|
|
if (dtc->wb_dirty >= wb_thresh)
|
|
return;
|
|
|
|
wb_setpoint = dirty_freerun_ceiling(wb_thresh,
|
|
dtc->wb_bg_thresh);
|
|
|
|
if (wb_setpoint == 0 || wb_setpoint == wb_thresh)
|
|
return;
|
|
|
|
wb_pos_ratio = pos_ratio_polynom(wb_setpoint, dtc->wb_dirty,
|
|
wb_thresh);
|
|
|
|
/*
|
|
* Typically, for strictlimit case, wb_setpoint << setpoint
|
|
* and pos_ratio >> wb_pos_ratio. In the other words global
|
|
* state ("dirty") is not limiting factor and we have to
|
|
* make decision based on wb counters. But there is an
|
|
* important case when global pos_ratio should get precedence:
|
|
* global limits are exceeded (e.g. due to activities on other
|
|
* wb's) while given strictlimit wb is below limit.
|
|
*
|
|
* "pos_ratio * wb_pos_ratio" would work for the case above,
|
|
* but it would look too non-natural for the case of all
|
|
* activity in the system coming from a single strictlimit wb
|
|
* with bdi->max_ratio == 100%.
|
|
*
|
|
* Note that min() below somewhat changes the dynamics of the
|
|
* control system. Normally, pos_ratio value can be well over 3
|
|
* (when globally we are at freerun and wb is well below wb
|
|
* setpoint). Now the maximum pos_ratio in the same situation
|
|
* is 2. We might want to tweak this if we observe the control
|
|
* system is too slow to adapt.
|
|
*/
|
|
dtc->pos_ratio = min(pos_ratio, wb_pos_ratio);
|
|
return;
|
|
}
|
|
|
|
/*
|
|
* We have computed basic pos_ratio above based on global situation. If
|
|
* the wb is over/under its share of dirty pages, we want to scale
|
|
* pos_ratio further down/up. That is done by the following mechanism.
|
|
*/
|
|
|
|
/*
|
|
* wb setpoint
|
|
*
|
|
* f(wb_dirty) := 1.0 + k * (wb_dirty - wb_setpoint)
|
|
*
|
|
* x_intercept - wb_dirty
|
|
* := --------------------------
|
|
* x_intercept - wb_setpoint
|
|
*
|
|
* The main wb control line is a linear function that subjects to
|
|
*
|
|
* (1) f(wb_setpoint) = 1.0
|
|
* (2) k = - 1 / (8 * write_bw) (in single wb case)
|
|
* or equally: x_intercept = wb_setpoint + 8 * write_bw
|
|
*
|
|
* For single wb case, the dirty pages are observed to fluctuate
|
|
* regularly within range
|
|
* [wb_setpoint - write_bw/2, wb_setpoint + write_bw/2]
|
|
* for various filesystems, where (2) can yield in a reasonable 12.5%
|
|
* fluctuation range for pos_ratio.
|
|
*
|
|
* For JBOD case, wb_thresh (not wb_dirty!) could fluctuate up to its
|
|
* own size, so move the slope over accordingly and choose a slope that
|
|
* yields 100% pos_ratio fluctuation on suddenly doubled wb_thresh.
|
|
*/
|
|
if (unlikely(wb_thresh > dtc->thresh))
|
|
wb_thresh = dtc->thresh;
|
|
/*
|
|
* It's very possible that wb_thresh is close to 0 not because the
|
|
* device is slow, but that it has remained inactive for long time.
|
|
* Honour such devices a reasonable good (hopefully IO efficient)
|
|
* threshold, so that the occasional writes won't be blocked and active
|
|
* writes can rampup the threshold quickly.
|
|
*/
|
|
wb_thresh = max(wb_thresh, (limit - dtc->dirty) / 8);
|
|
/*
|
|
* scale global setpoint to wb's:
|
|
* wb_setpoint = setpoint * wb_thresh / thresh
|
|
*/
|
|
x = div_u64((u64)wb_thresh << 16, dtc->thresh | 1);
|
|
wb_setpoint = setpoint * (u64)x >> 16;
|
|
/*
|
|
* Use span=(8*write_bw) in single wb case as indicated by
|
|
* (thresh - wb_thresh ~= 0) and transit to wb_thresh in JBOD case.
|
|
*
|
|
* wb_thresh thresh - wb_thresh
|
|
* span = --------- * (8 * write_bw) + ------------------ * wb_thresh
|
|
* thresh thresh
|
|
*/
|
|
span = (dtc->thresh - wb_thresh + 8 * write_bw) * (u64)x >> 16;
|
|
x_intercept = wb_setpoint + span;
|
|
|
|
if (dtc->wb_dirty < x_intercept - span / 4) {
|
|
pos_ratio = div64_u64(pos_ratio * (x_intercept - dtc->wb_dirty),
|
|
(x_intercept - wb_setpoint) | 1);
|
|
} else
|
|
pos_ratio /= 4;
|
|
|
|
/*
|
|
* wb reserve area, safeguard against dirty pool underrun and disk idle
|
|
* It may push the desired control point of global dirty pages higher
|
|
* than setpoint.
|
|
*/
|
|
x_intercept = wb_thresh / 2;
|
|
if (dtc->wb_dirty < x_intercept) {
|
|
if (dtc->wb_dirty > x_intercept / 8)
|
|
pos_ratio = div_u64(pos_ratio * x_intercept,
|
|
dtc->wb_dirty);
|
|
else
|
|
pos_ratio *= 8;
|
|
}
|
|
|
|
dtc->pos_ratio = pos_ratio;
|
|
}
|
|
|
|
static void wb_update_write_bandwidth(struct bdi_writeback *wb,
|
|
unsigned long elapsed,
|
|
unsigned long written)
|
|
{
|
|
const unsigned long period = roundup_pow_of_two(3 * HZ);
|
|
unsigned long avg = wb->avg_write_bandwidth;
|
|
unsigned long old = wb->write_bandwidth;
|
|
u64 bw;
|
|
|
|
/*
|
|
* bw = written * HZ / elapsed
|
|
*
|
|
* bw * elapsed + write_bandwidth * (period - elapsed)
|
|
* write_bandwidth = ---------------------------------------------------
|
|
* period
|
|
*
|
|
* @written may have decreased due to account_page_redirty().
|
|
* Avoid underflowing @bw calculation.
|
|
*/
|
|
bw = written - min(written, wb->written_stamp);
|
|
bw *= HZ;
|
|
if (unlikely(elapsed > period)) {
|
|
do_div(bw, elapsed);
|
|
avg = bw;
|
|
goto out;
|
|
}
|
|
bw += (u64)wb->write_bandwidth * (period - elapsed);
|
|
bw >>= ilog2(period);
|
|
|
|
/*
|
|
* one more level of smoothing, for filtering out sudden spikes
|
|
*/
|
|
if (avg > old && old >= (unsigned long)bw)
|
|
avg -= (avg - old) >> 3;
|
|
|
|
if (avg < old && old <= (unsigned long)bw)
|
|
avg += (old - avg) >> 3;
|
|
|
|
out:
|
|
/* keep avg > 0 to guarantee that tot > 0 if there are dirty wbs */
|
|
avg = max(avg, 1LU);
|
|
if (wb_has_dirty_io(wb)) {
|
|
long delta = avg - wb->avg_write_bandwidth;
|
|
WARN_ON_ONCE(atomic_long_add_return(delta,
|
|
&wb->bdi->tot_write_bandwidth) <= 0);
|
|
}
|
|
wb->write_bandwidth = bw;
|
|
wb->avg_write_bandwidth = avg;
|
|
}
|
|
|
|
static void update_dirty_limit(struct dirty_throttle_control *dtc)
|
|
{
|
|
struct wb_domain *dom = dtc_dom(dtc);
|
|
unsigned long thresh = dtc->thresh;
|
|
unsigned long limit = dom->dirty_limit;
|
|
|
|
/*
|
|
* Follow up in one step.
|
|
*/
|
|
if (limit < thresh) {
|
|
limit = thresh;
|
|
goto update;
|
|
}
|
|
|
|
/*
|
|
* Follow down slowly. Use the higher one as the target, because thresh
|
|
* may drop below dirty. This is exactly the reason to introduce
|
|
* dom->dirty_limit which is guaranteed to lie above the dirty pages.
|
|
*/
|
|
thresh = max(thresh, dtc->dirty);
|
|
if (limit > thresh) {
|
|
limit -= (limit - thresh) >> 5;
|
|
goto update;
|
|
}
|
|
return;
|
|
update:
|
|
dom->dirty_limit = limit;
|
|
}
|
|
|
|
static void domain_update_bandwidth(struct dirty_throttle_control *dtc,
|
|
unsigned long now)
|
|
{
|
|
struct wb_domain *dom = dtc_dom(dtc);
|
|
|
|
/*
|
|
* check locklessly first to optimize away locking for the most time
|
|
*/
|
|
if (time_before(now, dom->dirty_limit_tstamp + BANDWIDTH_INTERVAL))
|
|
return;
|
|
|
|
spin_lock(&dom->lock);
|
|
if (time_after_eq(now, dom->dirty_limit_tstamp + BANDWIDTH_INTERVAL)) {
|
|
update_dirty_limit(dtc);
|
|
dom->dirty_limit_tstamp = now;
|
|
}
|
|
spin_unlock(&dom->lock);
|
|
}
|
|
|
|
/*
|
|
* Maintain wb->dirty_ratelimit, the base dirty throttle rate.
|
|
*
|
|
* Normal wb tasks will be curbed at or below it in long term.
|
|
* Obviously it should be around (write_bw / N) when there are N dd tasks.
|
|
*/
|
|
static void wb_update_dirty_ratelimit(struct dirty_throttle_control *dtc,
|
|
unsigned long dirtied,
|
|
unsigned long elapsed)
|
|
{
|
|
struct bdi_writeback *wb = dtc->wb;
|
|
unsigned long dirty = dtc->dirty;
|
|
unsigned long freerun = dirty_freerun_ceiling(dtc->thresh, dtc->bg_thresh);
|
|
unsigned long limit = hard_dirty_limit(dtc_dom(dtc), dtc->thresh);
|
|
unsigned long setpoint = (freerun + limit) / 2;
|
|
unsigned long write_bw = wb->avg_write_bandwidth;
|
|
unsigned long dirty_ratelimit = wb->dirty_ratelimit;
|
|
unsigned long dirty_rate;
|
|
unsigned long task_ratelimit;
|
|
unsigned long balanced_dirty_ratelimit;
|
|
unsigned long step;
|
|
unsigned long x;
|
|
unsigned long shift;
|
|
|
|
/*
|
|
* The dirty rate will match the writeout rate in long term, except
|
|
* when dirty pages are truncated by userspace or re-dirtied by FS.
|
|
*/
|
|
dirty_rate = (dirtied - wb->dirtied_stamp) * HZ / elapsed;
|
|
|
|
/*
|
|
* task_ratelimit reflects each dd's dirty rate for the past 200ms.
|
|
*/
|
|
task_ratelimit = (u64)dirty_ratelimit *
|
|
dtc->pos_ratio >> RATELIMIT_CALC_SHIFT;
|
|
task_ratelimit++; /* it helps rampup dirty_ratelimit from tiny values */
|
|
|
|
/*
|
|
* A linear estimation of the "balanced" throttle rate. The theory is,
|
|
* if there are N dd tasks, each throttled at task_ratelimit, the wb's
|
|
* dirty_rate will be measured to be (N * task_ratelimit). So the below
|
|
* formula will yield the balanced rate limit (write_bw / N).
|
|
*
|
|
* Note that the expanded form is not a pure rate feedback:
|
|
* rate_(i+1) = rate_(i) * (write_bw / dirty_rate) (1)
|
|
* but also takes pos_ratio into account:
|
|
* rate_(i+1) = rate_(i) * (write_bw / dirty_rate) * pos_ratio (2)
|
|
*
|
|
* (1) is not realistic because pos_ratio also takes part in balancing
|
|
* the dirty rate. Consider the state
|
|
* pos_ratio = 0.5 (3)
|
|
* rate = 2 * (write_bw / N) (4)
|
|
* If (1) is used, it will stuck in that state! Because each dd will
|
|
* be throttled at
|
|
* task_ratelimit = pos_ratio * rate = (write_bw / N) (5)
|
|
* yielding
|
|
* dirty_rate = N * task_ratelimit = write_bw (6)
|
|
* put (6) into (1) we get
|
|
* rate_(i+1) = rate_(i) (7)
|
|
*
|
|
* So we end up using (2) to always keep
|
|
* rate_(i+1) ~= (write_bw / N) (8)
|
|
* regardless of the value of pos_ratio. As long as (8) is satisfied,
|
|
* pos_ratio is able to drive itself to 1.0, which is not only where
|
|
* the dirty count meet the setpoint, but also where the slope of
|
|
* pos_ratio is most flat and hence task_ratelimit is least fluctuated.
|
|
*/
|
|
balanced_dirty_ratelimit = div_u64((u64)task_ratelimit * write_bw,
|
|
dirty_rate | 1);
|
|
/*
|
|
* balanced_dirty_ratelimit ~= (write_bw / N) <= write_bw
|
|
*/
|
|
if (unlikely(balanced_dirty_ratelimit > write_bw))
|
|
balanced_dirty_ratelimit = write_bw;
|
|
|
|
/*
|
|
* We could safely do this and return immediately:
|
|
*
|
|
* wb->dirty_ratelimit = balanced_dirty_ratelimit;
|
|
*
|
|
* However to get a more stable dirty_ratelimit, the below elaborated
|
|
* code makes use of task_ratelimit to filter out singular points and
|
|
* limit the step size.
|
|
*
|
|
* The below code essentially only uses the relative value of
|
|
*
|
|
* task_ratelimit - dirty_ratelimit
|
|
* = (pos_ratio - 1) * dirty_ratelimit
|
|
*
|
|
* which reflects the direction and size of dirty position error.
|
|
*/
|
|
|
|
/*
|
|
* dirty_ratelimit will follow balanced_dirty_ratelimit iff
|
|
* task_ratelimit is on the same side of dirty_ratelimit, too.
|
|
* For example, when
|
|
* - dirty_ratelimit > balanced_dirty_ratelimit
|
|
* - dirty_ratelimit > task_ratelimit (dirty pages are above setpoint)
|
|
* lowering dirty_ratelimit will help meet both the position and rate
|
|
* control targets. Otherwise, don't update dirty_ratelimit if it will
|
|
* only help meet the rate target. After all, what the users ultimately
|
|
* feel and care are stable dirty rate and small position error.
|
|
*
|
|
* |task_ratelimit - dirty_ratelimit| is used to limit the step size
|
|
* and filter out the singular points of balanced_dirty_ratelimit. Which
|
|
* keeps jumping around randomly and can even leap far away at times
|
|
* due to the small 200ms estimation period of dirty_rate (we want to
|
|
* keep that period small to reduce time lags).
|
|
*/
|
|
step = 0;
|
|
|
|
/*
|
|
* For strictlimit case, calculations above were based on wb counters
|
|
* and limits (starting from pos_ratio = wb_position_ratio() and up to
|
|
* balanced_dirty_ratelimit = task_ratelimit * write_bw / dirty_rate).
|
|
* Hence, to calculate "step" properly, we have to use wb_dirty as
|
|
* "dirty" and wb_setpoint as "setpoint".
|
|
*
|
|
* We rampup dirty_ratelimit forcibly if wb_dirty is low because
|
|
* it's possible that wb_thresh is close to zero due to inactivity
|
|
* of backing device.
|
|
*/
|
|
if (unlikely(wb->bdi->capabilities & BDI_CAP_STRICTLIMIT)) {
|
|
dirty = dtc->wb_dirty;
|
|
if (dtc->wb_dirty < 8)
|
|
setpoint = dtc->wb_dirty + 1;
|
|
else
|
|
setpoint = (dtc->wb_thresh + dtc->wb_bg_thresh) / 2;
|
|
}
|
|
|
|
if (dirty < setpoint) {
|
|
x = min3(wb->balanced_dirty_ratelimit,
|
|
balanced_dirty_ratelimit, task_ratelimit);
|
|
if (dirty_ratelimit < x)
|
|
step = x - dirty_ratelimit;
|
|
} else {
|
|
x = max3(wb->balanced_dirty_ratelimit,
|
|
balanced_dirty_ratelimit, task_ratelimit);
|
|
if (dirty_ratelimit > x)
|
|
step = dirty_ratelimit - x;
|
|
}
|
|
|
|
/*
|
|
* Don't pursue 100% rate matching. It's impossible since the balanced
|
|
* rate itself is constantly fluctuating. So decrease the track speed
|
|
* when it gets close to the target. Helps eliminate pointless tremors.
|
|
*/
|
|
shift = dirty_ratelimit / (2 * step + 1);
|
|
if (shift < BITS_PER_LONG)
|
|
step = DIV_ROUND_UP(step >> shift, 8);
|
|
else
|
|
step = 0;
|
|
|
|
if (dirty_ratelimit < balanced_dirty_ratelimit)
|
|
dirty_ratelimit += step;
|
|
else
|
|
dirty_ratelimit -= step;
|
|
|
|
wb->dirty_ratelimit = max(dirty_ratelimit, 1UL);
|
|
wb->balanced_dirty_ratelimit = balanced_dirty_ratelimit;
|
|
|
|
trace_bdi_dirty_ratelimit(wb, dirty_rate, task_ratelimit);
|
|
}
|
|
|
|
static void __wb_update_bandwidth(struct dirty_throttle_control *gdtc,
|
|
struct dirty_throttle_control *mdtc,
|
|
unsigned long start_time,
|
|
bool update_ratelimit)
|
|
{
|
|
struct bdi_writeback *wb = gdtc->wb;
|
|
unsigned long now = jiffies;
|
|
unsigned long elapsed = now - wb->bw_time_stamp;
|
|
unsigned long dirtied;
|
|
unsigned long written;
|
|
|
|
lockdep_assert_held(&wb->list_lock);
|
|
|
|
/*
|
|
* rate-limit, only update once every 200ms.
|
|
*/
|
|
if (elapsed < BANDWIDTH_INTERVAL)
|
|
return;
|
|
|
|
dirtied = percpu_counter_read(&wb->stat[WB_DIRTIED]);
|
|
written = percpu_counter_read(&wb->stat[WB_WRITTEN]);
|
|
|
|
/*
|
|
* Skip quiet periods when disk bandwidth is under-utilized.
|
|
* (at least 1s idle time between two flusher runs)
|
|
*/
|
|
if (elapsed > HZ && time_before(wb->bw_time_stamp, start_time))
|
|
goto snapshot;
|
|
|
|
if (update_ratelimit) {
|
|
domain_update_bandwidth(gdtc, now);
|
|
wb_update_dirty_ratelimit(gdtc, dirtied, elapsed);
|
|
|
|
/*
|
|
* @mdtc is always NULL if !CGROUP_WRITEBACK but the
|
|
* compiler has no way to figure that out. Help it.
|
|
*/
|
|
if (IS_ENABLED(CONFIG_CGROUP_WRITEBACK) && mdtc) {
|
|
domain_update_bandwidth(mdtc, now);
|
|
wb_update_dirty_ratelimit(mdtc, dirtied, elapsed);
|
|
}
|
|
}
|
|
wb_update_write_bandwidth(wb, elapsed, written);
|
|
|
|
snapshot:
|
|
wb->dirtied_stamp = dirtied;
|
|
wb->written_stamp = written;
|
|
wb->bw_time_stamp = now;
|
|
}
|
|
|
|
void wb_update_bandwidth(struct bdi_writeback *wb, unsigned long start_time)
|
|
{
|
|
struct dirty_throttle_control gdtc = { GDTC_INIT(wb) };
|
|
|
|
__wb_update_bandwidth(&gdtc, NULL, start_time, false);
|
|
}
|
|
|
|
/*
 * Number of pages a task may dirty before balance_dirty_pages_ratelimited()
 * checks again whether dirty throttling has to start.
 *
 * If the interval is too low, big NUMA machines will call the expensive
 * global_zone_page_state() too often.  So it is scaled near-sqrt to the
 * safety margin (the number of pages that may still be dirtied without
 * exceeding the dirty limits).
 *
 * Returns 1 when @dirty has already reached @thresh.
 */
static unsigned long dirty_poll_interval(unsigned long dirty,
					 unsigned long thresh)
{
	unsigned long margin;

	if (thresh <= dirty)
		return 1;

	margin = thresh - dirty;
	/* Halving the log2 gives a power of two close to sqrt(margin). */
	return 1UL << (ilog2(margin) >> 1);
}
|
|
|
|
static unsigned long wb_max_pause(struct bdi_writeback *wb,
|
|
unsigned long wb_dirty)
|
|
{
|
|
unsigned long bw = wb->avg_write_bandwidth;
|
|
unsigned long t;
|
|
|
|
/*
|
|
* Limit pause time for small memory systems. If sleeping for too long
|
|
* time, a small pool of dirty/writeback pages may go empty and disk go
|
|
* idle.
|
|
*
|
|
* 8 serves as the safety ratio.
|
|
*/
|
|
t = wb_dirty / (1 + bw / roundup_pow_of_two(1 + HZ / 8));
|
|
t++;
|
|
|
|
return min_t(unsigned long, t, MAX_PAUSE);
|
|
}
|
|
|
|
static long wb_min_pause(struct bdi_writeback *wb,
|
|
long max_pause,
|
|
unsigned long task_ratelimit,
|
|
unsigned long dirty_ratelimit,
|
|
int *nr_dirtied_pause)
|
|
{
|
|
long hi = ilog2(wb->avg_write_bandwidth);
|
|
long lo = ilog2(wb->dirty_ratelimit);
|
|
long t; /* target pause */
|
|
long pause; /* estimated next pause */
|
|
int pages; /* target nr_dirtied_pause */
|
|
|
|
/* target for 10ms pause on 1-dd case */
|
|
t = max(1, HZ / 100);
|
|
|
|
/*
|
|
* Scale up pause time for concurrent dirtiers in order to reduce CPU
|
|
* overheads.
|
|
*
|
|
* (N * 10ms) on 2^N concurrent tasks.
|
|
*/
|
|
if (hi > lo)
|
|
t += (hi - lo) * (10 * HZ) / 1024;
|
|
|
|
/*
|
|
* This is a bit convoluted. We try to base the next nr_dirtied_pause
|
|
* on the much more stable dirty_ratelimit. However the next pause time
|
|
* will be computed based on task_ratelimit and the two rate limits may
|
|
* depart considerably at some time. Especially if task_ratelimit goes
|
|
* below dirty_ratelimit/2 and the target pause is max_pause, the next
|
|
* pause time will be max_pause*2 _trimmed down_ to max_pause. As a
|
|
* result task_ratelimit won't be executed faithfully, which could
|
|
* eventually bring down dirty_ratelimit.
|
|
*
|
|
* We apply two rules to fix it up:
|
|
* 1) try to estimate the next pause time and if necessary, use a lower
|
|
* nr_dirtied_pause so as not to exceed max_pause. When this happens,
|
|
* nr_dirtied_pause will be "dancing" with task_ratelimit.
|
|
* 2) limit the target pause time to max_pause/2, so that the normal
|
|
* small fluctuations of task_ratelimit won't trigger rule (1) and
|
|
* nr_dirtied_pause will remain as stable as dirty_ratelimit.
|
|
*/
|
|
t = min(t, 1 + max_pause / 2);
|
|
pages = dirty_ratelimit * t / roundup_pow_of_two(HZ);
|
|
|
|
/*
|
|
* Tiny nr_dirtied_pause is found to hurt I/O performance in the test
|
|
* case fio-mmap-randwrite-64k, which does 16*{sync read, async write}.
|
|
* When the 16 consecutive reads are often interrupted by some dirty
|
|
* throttling pause during the async writes, cfq will go into idles
|
|
* (deadline is fine). So push nr_dirtied_pause as high as possible
|
|
* until reaches DIRTY_POLL_THRESH=32 pages.
|
|
*/
|
|
if (pages < DIRTY_POLL_THRESH) {
|
|
t = max_pause;
|
|
pages = dirty_ratelimit * t / roundup_pow_of_two(HZ);
|
|
if (pages > DIRTY_POLL_THRESH) {
|
|
pages = DIRTY_POLL_THRESH;
|
|
t = HZ * DIRTY_POLL_THRESH / dirty_ratelimit;
|
|
}
|
|
}
|
|
|
|
pause = HZ * pages / (task_ratelimit + 1);
|
|
if (pause > max_pause) {
|
|
t = max_pause;
|
|
pages = task_ratelimit * t / roundup_pow_of_two(HZ);
|
|
}
|
|
|
|
*nr_dirtied_pause = pages;
|
|
/*
|
|
* The minimal pause time will normally be half the target pause time.
|
|
*/
|
|
return pages >= DIRTY_POLL_THRESH ? 1 + t / 2 : t;
|
|
}
|
|
|
|
static inline void wb_dirty_limits(struct dirty_throttle_control *dtc)
|
|
{
|
|
struct bdi_writeback *wb = dtc->wb;
|
|
unsigned long wb_reclaimable;
|
|
|
|
/*
|
|
* wb_thresh is not treated as some limiting factor as
|
|
* dirty_thresh, due to reasons
|
|
* - in JBOD setup, wb_thresh can fluctuate a lot
|
|
* - in a system with HDD and USB key, the USB key may somehow
|
|
* go into state (wb_dirty >> wb_thresh) either because
|
|
* wb_dirty starts high, or because wb_thresh drops low.
|
|
* In this case we don't want to hard throttle the USB key
|
|
* dirtiers for 100 seconds until wb_dirty drops under
|
|
* wb_thresh. Instead the auxiliary wb control line in
|
|
* wb_position_ratio() will let the dirtier task progress
|
|
* at some rate <= (write_bw / 2) for bringing down wb_dirty.
|
|
*/
|
|
dtc->wb_thresh = __wb_calc_thresh(dtc);
|
|
dtc->wb_bg_thresh = dtc->thresh ?
|
|
div_u64((u64)dtc->wb_thresh * dtc->bg_thresh, dtc->thresh) : 0;
|
|
|
|
/*
|
|
* In order to avoid the stacked BDI deadlock we need
|
|
* to ensure we accurately count the 'dirty' pages when
|
|
* the threshold is low.
|
|
*
|
|
* Otherwise it would be possible to get thresh+n pages
|
|
* reported dirty, even though there are thresh-m pages
|
|
* actually dirty; with m+n sitting in the percpu
|
|
* deltas.
|
|
*/
|
|
if (dtc->wb_thresh < 2 * wb_stat_error()) {
|
|
wb_reclaimable = wb_stat_sum(wb, WB_RECLAIMABLE);
|
|
dtc->wb_dirty = wb_reclaimable + wb_stat_sum(wb, WB_WRITEBACK);
|
|
} else {
|
|
wb_reclaimable = wb_stat(wb, WB_RECLAIMABLE);
|
|
dtc->wb_dirty = wb_reclaimable + wb_stat(wb, WB_WRITEBACK);
|
|
}
|
|
}
|
|
|
|
/*
|
|
* balance_dirty_pages() must be called by processes which are generating dirty
|
|
* data. It looks at the number of dirty pages in the machine and will force
|
|
* the caller to wait once crossing the (background_thresh + dirty_thresh) / 2.
|
|
* If we're over `background_thresh' then the writeback threads are woken to
|
|
* perform some writeout.
|
|
*/
|
|
static void balance_dirty_pages(struct bdi_writeback *wb,
|
|
unsigned long pages_dirtied)
|
|
{
|
|
struct dirty_throttle_control gdtc_stor = { GDTC_INIT(wb) };
|
|
struct dirty_throttle_control mdtc_stor = { MDTC_INIT(wb, &gdtc_stor) };
|
|
struct dirty_throttle_control * const gdtc = &gdtc_stor;
|
|
struct dirty_throttle_control * const mdtc = mdtc_valid(&mdtc_stor) ?
|
|
&mdtc_stor : NULL;
|
|
struct dirty_throttle_control *sdtc;
|
|
unsigned long nr_reclaimable; /* = file_dirty + unstable_nfs */
|
|
long period;
|
|
long pause;
|
|
long max_pause;
|
|
long min_pause;
|
|
int nr_dirtied_pause;
|
|
bool dirty_exceeded = false;
|
|
unsigned long task_ratelimit;
|
|
unsigned long dirty_ratelimit;
|
|
struct backing_dev_info *bdi = wb->bdi;
|
|
bool strictlimit = bdi->capabilities & BDI_CAP_STRICTLIMIT;
|
|
unsigned long start_time = jiffies;
|
|
|
|
for (;;) {
|
|
unsigned long now = jiffies;
|
|
unsigned long dirty, thresh, bg_thresh;
|
|
unsigned long m_dirty = 0; /* stop bogus uninit warnings */
|
|
unsigned long m_thresh = 0;
|
|
unsigned long m_bg_thresh = 0;
|
|
|
|
/*
|
|
* Unstable writes are a feature of certain networked
|
|
* filesystems (i.e. NFS) in which data may have been
|
|
* written to the server's write cache, but has not yet
|
|
* been flushed to permanent storage.
|
|
*/
|
|
nr_reclaimable = global_node_page_state(NR_FILE_DIRTY) +
|
|
global_node_page_state(NR_UNSTABLE_NFS);
|
|
gdtc->avail = global_dirtyable_memory();
|
|
gdtc->dirty = nr_reclaimable + global_node_page_state(NR_WRITEBACK);
|
|
|
|
domain_dirty_limits(gdtc);
|
|
|
|
if (unlikely(strictlimit)) {
|
|
wb_dirty_limits(gdtc);
|
|
|
|
dirty = gdtc->wb_dirty;
|
|
thresh = gdtc->wb_thresh;
|
|
bg_thresh = gdtc->wb_bg_thresh;
|
|
} else {
|
|
dirty = gdtc->dirty;
|
|
thresh = gdtc->thresh;
|
|
bg_thresh = gdtc->bg_thresh;
|
|
}
|
|
|
|
if (mdtc) {
|
|
unsigned long filepages, headroom, writeback;
|
|
|
|
/*
|
|
* If @wb belongs to !root memcg, repeat the same
|
|
* basic calculations for the memcg domain.
|
|
*/
|
|
mem_cgroup_wb_stats(wb, &filepages, &headroom,
|
|
&mdtc->dirty, &writeback);
|
|
mdtc->dirty += writeback;
|
|
mdtc_calc_avail(mdtc, filepages, headroom);
|
|
|
|
domain_dirty_limits(mdtc);
|
|
|
|
if (unlikely(strictlimit)) {
|
|
wb_dirty_limits(mdtc);
|
|
m_dirty = mdtc->wb_dirty;
|
|
m_thresh = mdtc->wb_thresh;
|
|
m_bg_thresh = mdtc->wb_bg_thresh;
|
|
} else {
|
|
m_dirty = mdtc->dirty;
|
|
m_thresh = mdtc->thresh;
|
|
m_bg_thresh = mdtc->bg_thresh;
|
|
}
|
|
}
|
|
|
|
/*
|
|
* Throttle it only when the background writeback cannot
|
|
* catch-up. This avoids (excessively) small writeouts
|
|
* when the wb limits are ramping up in case of !strictlimit.
|
|
*
|
|
* In strictlimit case make decision based on the wb counters
|
|
* and limits. Small writeouts when the wb limits are ramping
|
|
* up are the price we consciously pay for strictlimit-ing.
|
|
*
|
|
* If memcg domain is in effect, @dirty should be under
|
|
* both global and memcg freerun ceilings.
|
|
*/
|
|
if (dirty <= dirty_freerun_ceiling(thresh, bg_thresh) &&
|
|
(!mdtc ||
|
|
m_dirty <= dirty_freerun_ceiling(m_thresh, m_bg_thresh))) {
|
|
unsigned long intv = dirty_poll_interval(dirty, thresh);
|
|
unsigned long m_intv = ULONG_MAX;
|
|
|
|
current->dirty_paused_when = now;
|
|
current->nr_dirtied = 0;
|
|
if (mdtc)
|
|
m_intv = dirty_poll_interval(m_dirty, m_thresh);
|
|
current->nr_dirtied_pause = min(intv, m_intv);
|
|
break;
|
|
}
|
|
|
|
if (unlikely(!writeback_in_progress(wb)))
|
|
wb_start_background_writeback(wb);
|
|
|
|
/*
|
|
* Calculate global domain's pos_ratio and select the
|
|
* global dtc by default.
|
|
*/
|
|
if (!strictlimit)
|
|
wb_dirty_limits(gdtc);
|
|
|
|
dirty_exceeded = (gdtc->wb_dirty > gdtc->wb_thresh) &&
|
|
((gdtc->dirty > gdtc->thresh) || strictlimit);
|
|
|
|
wb_position_ratio(gdtc);
|
|
sdtc = gdtc;
|
|
|
|
if (mdtc) {
|
|
/*
|
|
* If memcg domain is in effect, calculate its
|
|
* pos_ratio. @wb should satisfy constraints from
|
|
* both global and memcg domains. Choose the one
|
|
* w/ lower pos_ratio.
|
|
*/
|
|
if (!strictlimit)
|
|
wb_dirty_limits(mdtc);
|
|
|
|
dirty_exceeded |= (mdtc->wb_dirty > mdtc->wb_thresh) &&
|
|
((mdtc->dirty > mdtc->thresh) || strictlimit);
|
|
|
|
wb_position_ratio(mdtc);
|
|
if (mdtc->pos_ratio < gdtc->pos_ratio)
|
|
sdtc = mdtc;
|
|
}
|
|
|
|
if (dirty_exceeded && !wb->dirty_exceeded)
|
|
wb->dirty_exceeded = 1;
|
|
|
|
if (time_is_before_jiffies(wb->bw_time_stamp +
|
|
BANDWIDTH_INTERVAL)) {
|
|
spin_lock(&wb->list_lock);
|
|
__wb_update_bandwidth(gdtc, mdtc, start_time, true);
|
|
spin_unlock(&wb->list_lock);
|
|
}
|
|
|
|
/* throttle according to the chosen dtc */
|
|
dirty_ratelimit = wb->dirty_ratelimit;
|
|
task_ratelimit = ((u64)dirty_ratelimit * sdtc->pos_ratio) >>
|
|
RATELIMIT_CALC_SHIFT;
|
|
max_pause = wb_max_pause(wb, sdtc->wb_dirty);
|
|
min_pause = wb_min_pause(wb, max_pause,
|
|
task_ratelimit, dirty_ratelimit,
|
|
&nr_dirtied_pause);
|
|
|
|
if (unlikely(task_ratelimit == 0)) {
|
|
period = max_pause;
|
|
pause = max_pause;
|
|
goto pause;
|
|
}
|
|
period = HZ * pages_dirtied / task_ratelimit;
|
|
pause = period;
|
|
if (current->dirty_paused_when)
|
|
pause -= now - current->dirty_paused_when;
|
|
/*
|
|
* For less than 1s think time (ext3/4 may block the dirtier
|
|
* for up to 800ms from time to time on 1-HDD; so does xfs,
|
|
* however at much less frequency), try to compensate it in
|
|
* future periods by updating the virtual time; otherwise just
|
|
* do a reset, as it may be a light dirtier.
|
|
*/
|
|
if (pause < min_pause) {
|
|
trace_balance_dirty_pages(wb,
|
|
sdtc->thresh,
|
|
sdtc->bg_thresh,
|
|
sdtc->dirty,
|
|
sdtc->wb_thresh,
|
|
sdtc->wb_dirty,
|
|
dirty_ratelimit,
|
|
task_ratelimit,
|
|
pages_dirtied,
|
|
period,
|
|
min(pause, 0L),
|
|
start_time);
|
|
if (pause < -HZ) {
|
|
current->dirty_paused_when = now;
|
|
current->nr_dirtied = 0;
|
|
} else if (period) {
|
|
current->dirty_paused_when += period;
|
|
current->nr_dirtied = 0;
|
|
} else if (current->nr_dirtied_pause <= pages_dirtied)
|
|
current->nr_dirtied_pause += pages_dirtied;
|
|
break;
|
|
}
|
|
if (unlikely(pause > max_pause)) {
|
|
/* for occasional dropped task_ratelimit */
|
|
now += min(pause - max_pause, max_pause);
|
|
pause = max_pause;
|
|
}
|
|
|
|
pause:
|
|
trace_balance_dirty_pages(wb,
|
|
sdtc->thresh,
|
|
sdtc->bg_thresh,
|
|
sdtc->dirty,
|
|
sdtc->wb_thresh,
|
|
sdtc->wb_dirty,
|
|
dirty_ratelimit,
|
|
task_ratelimit,
|
|
pages_dirtied,
|
|
period,
|
|
pause,
|
|
start_time);
|
|
__set_current_state(TASK_KILLABLE);
|
|
wb->dirty_sleep = now;
|
|
io_schedule_timeout(pause);
|
|
|
|
current->dirty_paused_when = now + pause;
|
|
current->nr_dirtied = 0;
|
|
current->nr_dirtied_pause = nr_dirtied_pause;
|
|
|
|
/*
|
|
* This is typically equal to (dirty < thresh) and can also
|
|
* keep "1000+ dd on a slow USB stick" under control.
|
|
*/
|
|
if (task_ratelimit)
|
|
break;
|
|
|
|
/*
|
|
* In the case of an unresponding NFS server and the NFS dirty
|
|
* pages exceeds dirty_thresh, give the other good wb's a pipe
|
|
* to go through, so that tasks on them still remain responsive.
|
|
*
|
|
* In theory 1 page is enough to keep the consumer-producer
|
|
* pipe going: the flusher cleans 1 page => the task dirties 1
|
|
* more page. However wb_dirty has accounting errors. So use
|
|
* the larger and more IO friendly wb_stat_error.
|
|
*/
|
|
if (sdtc->wb_dirty <= wb_stat_error())
|
|
break;
|
|
|
|
if (fatal_signal_pending(current))
|
|
break;
|
|
}
|
|
|
|
if (!dirty_exceeded && wb->dirty_exceeded)
|
|
wb->dirty_exceeded = 0;
|
|
|
|
if (writeback_in_progress(wb))
|
|
return;
|
|
|
|
/*
|
|
* In laptop mode, we wait until hitting the higher threshold before
|
|
* starting background writeout, and then write out all the way down
|
|
* to the lower threshold. So slow writers cause minimal disk activity.
|
|
*
|
|
* In normal mode, we start background writeout at the lower
|
|
* background_thresh, to keep the amount of dirty memory low.
|
|
*/
|
|
if (laptop_mode)
|
|
return;
|
|
|
|
if (nr_reclaimable > gdtc->bg_thresh)
|
|
wb_start_background_writeback(wb);
|
|
}
|
|
|
|
static DEFINE_PER_CPU(int, bdp_ratelimits);
|
|
|
|
/*
|
|
* Normal tasks are throttled by
|
|
* loop {
|
|
* dirty tsk->nr_dirtied_pause pages;
|
|
* take a snap in balance_dirty_pages();
|
|
* }
|
|
* However there is a worst case. If every task exit immediately when dirtied
|
|
* (tsk->nr_dirtied_pause - 1) pages, balance_dirty_pages() will never be
|
|
* called to throttle the page dirties. The solution is to save the not yet
|
|
* throttled page dirties in dirty_throttle_leaks on task exit and charge them
|
|
* randomly into the running tasks. This works well for the above worst case,
|
|
* as the new task will pick up and accumulate the old task's leaked dirty
|
|
* count and eventually get throttled.
|
|
*/
|
|
DEFINE_PER_CPU(int, dirty_throttle_leaks) = 0;
|
|
|
|
/**
|
|
* balance_dirty_pages_ratelimited - balance dirty memory state
|
|
* @mapping: address_space which was dirtied
|
|
*
|
|
* Processes which are dirtying memory should call in here once for each page
|
|
* which was newly dirtied. The function will periodically check the system's
|
|
* dirty state and will initiate writeback if needed.
|
|
*
|
|
* On really big machines, get_writeback_state is expensive, so try to avoid
|
|
* calling it too often (ratelimiting). But once we're over the dirty memory
|
|
* limit we decrease the ratelimiting by a lot, to prevent individual processes
|
|
* from overshooting the limit by (ratelimit_pages) each.
|
|
*/
|
|
void balance_dirty_pages_ratelimited(struct address_space *mapping)
|
|
{
|
|
struct inode *inode = mapping->host;
|
|
struct backing_dev_info *bdi = inode_to_bdi(inode);
|
|
struct bdi_writeback *wb = NULL;
|
|
int ratelimit;
|
|
int *p;
|
|
|
|
if (!bdi_cap_account_dirty(bdi))
|
|
return;
|
|
|
|
if (inode_cgwb_enabled(inode))
|
|
wb = wb_get_create_current(bdi, GFP_KERNEL);
|
|
if (!wb)
|
|
wb = &bdi->wb;
|
|
|
|
ratelimit = current->nr_dirtied_pause;
|
|
if (wb->dirty_exceeded)
|
|
ratelimit = min(ratelimit, 32 >> (PAGE_SHIFT - 10));
|
|
|
|
preempt_disable();
|
|
/*
|
|
* This prevents one CPU to accumulate too many dirtied pages without
|
|
* calling into balance_dirty_pages(), which can happen when there are
|
|
* 1000+ tasks, all of them start dirtying pages at exactly the same
|
|
* time, hence all honoured too large initial task->nr_dirtied_pause.
|
|
*/
|
|
p = this_cpu_ptr(&bdp_ratelimits);
|
|
if (unlikely(current->nr_dirtied >= ratelimit))
|
|
*p = 0;
|
|
else if (unlikely(*p >= ratelimit_pages)) {
|
|
*p = 0;
|
|
ratelimit = 0;
|
|
}
|
|
/*
|
|
* Pick up the dirtied pages by the exited tasks. This avoids lots of
|
|
* short-lived tasks (eg. gcc invocations in a kernel build) escaping
|
|
* the dirty throttling and livelock other long-run dirtiers.
|
|
*/
|
|
p = this_cpu_ptr(&dirty_throttle_leaks);
|
|
if (*p > 0 && current->nr_dirtied < ratelimit) {
|
|
unsigned long nr_pages_dirtied;
|
|
nr_pages_dirtied = min(*p, ratelimit - current->nr_dirtied);
|
|
*p -= nr_pages_dirtied;
|
|
current->nr_dirtied += nr_pages_dirtied;
|
|
}
|
|
preempt_enable();
|
|
|
|
if (unlikely(current->nr_dirtied >= ratelimit))
|
|
balance_dirty_pages(wb, current->nr_dirtied);
|
|
|
|
wb_put(wb);
|
|
}
|
|
EXPORT_SYMBOL(balance_dirty_pages_ratelimited);
|
|
|
|
/**
|
|
* wb_over_bg_thresh - does @wb need to be written back?
|
|
* @wb: bdi_writeback of interest
|
|
*
|
|
* Determines whether background writeback should keep writing @wb or it's
|
|
* clean enough. Returns %true if writeback should continue.
|
|
*/
|
|
bool wb_over_bg_thresh(struct bdi_writeback *wb)
|
|
{
|
|
struct dirty_throttle_control gdtc_stor = { GDTC_INIT(wb) };
|
|
struct dirty_throttle_control mdtc_stor = { MDTC_INIT(wb, &gdtc_stor) };
|
|
struct dirty_throttle_control * const gdtc = &gdtc_stor;
|
|
struct dirty_throttle_control * const mdtc = mdtc_valid(&mdtc_stor) ?
|
|
&mdtc_stor : NULL;
|
|
|
|
/*
|
|
* Similar to balance_dirty_pages() but ignores pages being written
|
|
* as we're trying to decide whether to put more under writeback.
|
|
*/
|
|
gdtc->avail = global_dirtyable_memory();
|
|
gdtc->dirty = global_node_page_state(NR_FILE_DIRTY) +
|
|
global_node_page_state(NR_UNSTABLE_NFS);
|
|
domain_dirty_limits(gdtc);
|
|
|
|
if (gdtc->dirty > gdtc->bg_thresh)
|
|
return true;
|
|
|
|
if (wb_stat(wb, WB_RECLAIMABLE) >
|
|
wb_calc_thresh(gdtc->wb, gdtc->bg_thresh))
|
|
return true;
|
|
|
|
if (mdtc) {
|
|
unsigned long filepages, headroom, writeback;
|
|
|
|
mem_cgroup_wb_stats(wb, &filepages, &headroom, &mdtc->dirty,
|
|
&writeback);
|
|
mdtc_calc_avail(mdtc, filepages, headroom);
|
|
domain_dirty_limits(mdtc); /* ditto, ignore writeback */
|
|
|
|
if (mdtc->dirty > mdtc->bg_thresh)
|
|
return true;
|
|
|
|
if (wb_stat(wb, WB_RECLAIMABLE) >
|
|
wb_calc_thresh(mdtc->wb, mdtc->bg_thresh))
|
|
return true;
|
|
}
|
|
|
|
return false;
|
|
}
|
|
|
|
/*
|
|
* sysctl handler for /proc/sys/vm/dirty_writeback_centisecs
|
|
*/
|
|
int dirty_writeback_centisecs_handler(struct ctl_table *table, int write,
|
|
void *buffer, size_t *length, loff_t *ppos)
|
|
{
|
|
unsigned int old_interval = dirty_writeback_interval;
|
|
int ret;
|
|
|
|
ret = proc_dointvec(table, write, buffer, length, ppos);
|
|
|
|
/*
|
|
* Writing 0 to dirty_writeback_interval will disable periodic writeback
|
|
* and a different non-zero value will wakeup the writeback threads.
|
|
* wb_wakeup_delayed() would be more appropriate, but it's a pain to
|
|
* iterate over all bdis and wbs.
|
|
* The reason we do this is to make the change take effect immediately.
|
|
*/
|
|
if (!ret && write && dirty_writeback_interval &&
|
|
dirty_writeback_interval != old_interval)
|
|
wakeup_flusher_threads(WB_REASON_PERIODIC);
|
|
|
|
return ret;
|
|
}
|
|
|
|
#ifdef CONFIG_BLOCK
|
|
void laptop_mode_timer_fn(struct timer_list *t)
|
|
{
|
|
struct backing_dev_info *backing_dev_info =
|
|
from_timer(backing_dev_info, t, laptop_mode_wb_timer);
|
|
|
|
wakeup_flusher_threads_bdi(backing_dev_info, WB_REASON_LAPTOP_TIMER);
|
|
}
|
|
|
|
/*
|
|
* We've spun up the disk and we're in laptop mode: schedule writeback
|
|
* of all dirty data a few seconds from now. If the flush is already scheduled
|
|
* then push it back - the user is still using the disk.
|
|
*/
|
|
void laptop_io_completion(struct backing_dev_info *info)
|
|
{
|
|
mod_timer(&info->laptop_mode_wb_timer, jiffies + laptop_mode);
|
|
}
|
|
|
|
/*
|
|
* We're in laptop mode and we've just synced. The sync's writes will have
|
|
* caused another writeback to be scheduled by laptop_io_completion.
|
|
* Nothing needs to be written back anymore, so we unschedule the writeback.
|
|
*/
|
|
void laptop_sync_completion(void)
|
|
{
|
|
struct backing_dev_info *bdi;
|
|
|
|
rcu_read_lock();
|
|
|
|
list_for_each_entry_rcu(bdi, &bdi_list, bdi_list)
|
|
del_timer(&bdi->laptop_mode_wb_timer);
|
|
|
|
rcu_read_unlock();
|
|
}
|
|
#endif
|
|
|
|
/*
|
|
* If ratelimit_pages is too high then we can get into dirty-data overload
|
|
* if a large number of processes all perform writes at the same time.
|
|
* If it is too low then SMP machines will call the (expensive)
|
|
* get_writeback_state too often.
|
|
*
|
|
* Here we set ratelimit_pages to a level which ensures that when all CPUs are
|
|
* dirtying in parallel, we cannot go more than 3% (1/32) over the dirty memory
|
|
* thresholds.
|
|
*/
|
|
|
|
void writeback_set_ratelimit(void)
|
|
{
|
|
struct wb_domain *dom = &global_wb_domain;
|
|
unsigned long background_thresh;
|
|
unsigned long dirty_thresh;
|
|
|
|
global_dirty_limits(&background_thresh, &dirty_thresh);
|
|
dom->dirty_limit = dirty_thresh;
|
|
ratelimit_pages = dirty_thresh / (num_online_cpus() * 32);
|
|
if (ratelimit_pages < 16)
|
|
ratelimit_pages = 16;
|
|
}
|
|
|
|
/*
 * CPU hotplug callback: recompute ratelimit_pages.  @cpu is not used.
 * Always returns 0.
 */
static int page_writeback_cpu_online(unsigned int cpu)
{
	writeback_set_ratelimit();

	return 0;
}
|
|
|
|
/*
|
|
* Called early on to tune the page writeback dirty limits.
|
|
*
|
|
* We used to scale dirty pages according to how total memory
|
|
* related to pages that could be allocated for buffers (by
|
|
* comparing nr_free_buffer_pages() to vm_total_pages.
|
|
*
|
|
* However, that was when we used "dirty_ratio" to scale with
|
|
* all memory, and we don't do that any more. "dirty_ratio"
|
|
* is now applied to total non-HIGHPAGE memory (by subtracting
|
|
* totalhigh_pages from vm_total_pages), and as such we can't
|
|
* get into the old insane situation any more where we had
|
|
* large amounts of dirty pages compared to a small amount of
|
|
* non-HIGHMEM memory.
|
|
*
|
|
* But we might still want to scale the dirty_ratio by how
|
|
* much memory the box has..
|
|
*/
|
|
void __init page_writeback_init(void)
|
|
{
|
|
BUG_ON(wb_domain_init(&global_wb_domain, GFP_KERNEL));
|
|
|
|
cpuhp_setup_state(CPUHP_AP_ONLINE_DYN, "mm/writeback:online",
|
|
page_writeback_cpu_online, NULL);
|
|
cpuhp_setup_state(CPUHP_MM_WRITEBACK_DEAD, "mm/writeback:dead", NULL,
|
|
page_writeback_cpu_online);
|
|
}
|
|
|
|
/**
|
|
* tag_pages_for_writeback - tag pages to be written by write_cache_pages
|
|
* @mapping: address space structure to write
|
|
* @start: starting page index
|
|
* @end: ending page index (inclusive)
|
|
*
|
|
* This function scans the page range from @start to @end (inclusive) and tags
|
|
* all pages that have DIRTY tag set with a special TOWRITE tag. The idea is
|
|
* that write_cache_pages (or whoever calls this function) will then use
|
|
* TOWRITE tag to identify pages eligible for writeback. This mechanism is
|
|
* used to avoid livelocking of writeback by a process steadily creating new
|
|
* dirty pages in the file (thus it is important for this function to be quick
|
|
* so that it can tag pages faster than a dirtying process can create them).
|
|
*/
|
|
/*
|
|
* We tag pages in batches of WRITEBACK_TAG_BATCH to reduce the i_pages lock
|
|
* latency.
|
|
*/
|
|
void tag_pages_for_writeback(struct address_space *mapping,
|
|
pgoff_t start, pgoff_t end)
|
|
{
|
|
#define WRITEBACK_TAG_BATCH 4096
|
|
unsigned long tagged = 0;
|
|
struct radix_tree_iter iter;
|
|
void **slot;
|
|
|
|
xa_lock_irq(&mapping->i_pages);
|
|
radix_tree_for_each_tagged(slot, &mapping->i_pages, &iter, start,
|
|
PAGECACHE_TAG_DIRTY) {
|
|
if (iter.index > end)
|
|
break;
|
|
radix_tree_iter_tag_set(&mapping->i_pages, &iter,
|
|
PAGECACHE_TAG_TOWRITE);
|
|
tagged++;
|
|
if ((tagged % WRITEBACK_TAG_BATCH) != 0)
|
|
continue;
|
|
slot = radix_tree_iter_resume(slot, &iter);
|
|
xa_unlock_irq(&mapping->i_pages);
|
|
cond_resched();
|
|
xa_lock_irq(&mapping->i_pages);
|
|
}
|
|
xa_unlock_irq(&mapping->i_pages);
|
|
}
|
|
EXPORT_SYMBOL(tag_pages_for_writeback);
|
|
|
|
/**
|
|
* write_cache_pages - walk the list of dirty pages of the given address space and write all of them.
|
|
* @mapping: address space structure to write
|
|
* @wbc: subtract the number of written pages from *@wbc->nr_to_write
|
|
* @writepage: function called for each page
|
|
* @data: data passed to writepage function
|
|
*
|
|
* If a page is already under I/O, write_cache_pages() skips it, even
|
|
* if it's dirty. This is desirable behaviour for memory-cleaning writeback,
|
|
* but it is INCORRECT for data-integrity system calls such as fsync(). fsync()
|
|
* and msync() need to guarantee that all the data which was dirty at the time
|
|
* the call was made get new I/O started against them. If wbc->sync_mode is
|
|
* WB_SYNC_ALL then we were called for data integrity and we must wait for
|
|
* existing IO to complete.
|
|
*
|
|
* To avoid livelocks (when other process dirties new pages), we first tag
|
|
* pages which should be written back with TOWRITE tag and only then start
|
|
* writing them. For data-integrity sync we have to be careful so that we do
|
|
* not miss some pages (e.g., because some other process has cleared TOWRITE
|
|
* tag we set). The rule we follow is that TOWRITE tag can be cleared only
|
|
* by the process clearing the DIRTY tag (and submitting the page for IO).
|
|
*
|
|
* To avoid deadlocks between range_cyclic writeback and callers that hold
|
|
* pages in PageWriteback to aggregate IO until write_cache_pages() returns,
|
|
* we do not loop back to the start of the file. Doing so causes a page
|
|
* lock/page writeback access order inversion - we should only ever lock
|
|
* multiple pages in ascending page->index order, and looping back to the start
|
|
* of the file violates that rule and causes deadlocks.
|
|
*/
|
|
int write_cache_pages(struct address_space *mapping,
|
|
struct writeback_control *wbc, writepage_t writepage,
|
|
void *data)
|
|
{
|
|
int ret = 0;
|
|
int done = 0;
|
|
int error;
|
|
struct pagevec pvec;
|
|
int nr_pages;
|
|
pgoff_t uninitialized_var(writeback_index);
|
|
pgoff_t index;
|
|
pgoff_t end; /* Inclusive */
|
|
pgoff_t done_index;
|
|
int range_whole = 0;
|
|
int tag;
|
|
|
|
pagevec_init(&pvec);
|
|
if (wbc->range_cyclic) {
|
|
writeback_index = mapping->writeback_index; /* prev offset */
|
|
index = writeback_index;
|
|
end = -1;
|
|
} else {
|
|
index = wbc->range_start >> PAGE_SHIFT;
|
|
end = wbc->range_end >> PAGE_SHIFT;
|
|
if (wbc->range_start == 0 && wbc->range_end == LLONG_MAX)
|
|
range_whole = 1;
|
|
}
|
|
if (wbc->sync_mode == WB_SYNC_ALL || wbc->tagged_writepages)
|
|
tag = PAGECACHE_TAG_TOWRITE;
|
|
else
|
|
tag = PAGECACHE_TAG_DIRTY;
|
|
if (wbc->sync_mode == WB_SYNC_ALL || wbc->tagged_writepages)
|
|
tag_pages_for_writeback(mapping, index, end);
|
|
done_index = index;
|
|
while (!done && (index <= end)) {
|
|
int i;
|
|
|
|
nr_pages = pagevec_lookup_range_tag(&pvec, mapping, &index, end,
|
|
tag);
|
|
if (nr_pages == 0)
|
|
break;
|
|
|
|
for (i = 0; i < nr_pages; i++) {
|
|
struct page *page = pvec.pages[i];
|
|
|
|
done_index = page->index;
|
|
|
|
lock_page(page);
|
|
|
|
/*
|
|
* Page truncated or invalidated. We can freely skip it
|
|
* then, even for data integrity operations: the page
|
|
* has disappeared concurrently, so there could be no
|
|
* real expectation of this data interity operation
|
|
* even if there is now a new, dirty page at the same
|
|
* pagecache address.
|
|
*/
|
|
if (unlikely(page->mapping != mapping)) {
|
|
continue_unlock:
|
|
unlock_page(page);
|
|
continue;
|
|
}
|
|
|
|
if (!PageDirty(page)) {
|
|
/* someone wrote it for us */
|
|
goto continue_unlock;
|
|
}
|
|
|
|
if (PageWriteback(page)) {
|
|
if (wbc->sync_mode != WB_SYNC_NONE)
|
|
wait_on_page_writeback(page);
|
|
else
|
|
goto continue_unlock;
|
|
}
|
|
|
|
BUG_ON(PageWriteback(page));
|
|
if (!clear_page_dirty_for_io(page))
|
|
goto continue_unlock;
|
|
|
|
trace_wbc_writepage(wbc, inode_to_bdi(mapping->host));
|
|
error = (*writepage)(page, wbc, data);
|
|
if (unlikely(error)) {
|
|
/*
|
|
* Handle errors according to the type of
|
|
* writeback. There's no need to continue for
|
|
* background writeback. Just push done_index
|
|
* past this page so media errors won't choke
|
|
* writeout for the entire file. For integrity
|
|
* writeback, we must process the entire dirty
|
|
* set regardless of errors because the fs may
|
|
* still have state to clear for each page. In
|
|
* that case we continue processing and return
|
|
* the first error.
|
|
*/
|
|
if (error == AOP_WRITEPAGE_ACTIVATE) {
|
|
unlock_page(page);
|
|
error = 0;
|
|
} else if (wbc->sync_mode != WB_SYNC_ALL) {
|
|
ret = error;
|
|
done_index = page->index + 1;
|
|
done = 1;
|
|
break;
|
|
}
|
|
if (!ret)
|
|
ret = error;
|
|
}
|
|
|
|
/*
|
|
* We stop writing back only if we are not doing
|
|
* integrity sync. In case of integrity sync we have to
|
|
* keep going until we have written all the pages
|
|
* we tagged for writeback prior to entering this loop.
|
|
*/
|
|
if (--wbc->nr_to_write <= 0 &&
|
|
wbc->sync_mode == WB_SYNC_NONE) {
|
|
done = 1;
|
|
break;
|
|
}
|
|
}
|
|
pagevec_release(&pvec);
|
|
cond_resched();
|
|
}
|
|
|
|
/*
|
|
* If we hit the last page and there is more work to be done: wrap
|
|
* back the index back to the start of the file for the next
|
|
* time we are called.
|
|
*/
|
|
if (wbc->range_cyclic && !done)
|
|
done_index = 0;
|
|
if (wbc->range_cyclic || (range_whole && wbc->nr_to_write > 0))
|
|
mapping->writeback_index = done_index;
|
|
|
|
return ret;
|
|
}
|
|
EXPORT_SYMBOL(write_cache_pages);
|
|
|
|
/*
|
|
* Function used by generic_writepages to call the real writepage
|
|
* function and set the mapping flags on error
|
|
*/
|
|
static int __writepage(struct page *page, struct writeback_control *wbc,
|
|
void *data)
|
|
{
|
|
struct address_space *mapping = data;
|
|
int ret = mapping->a_ops->writepage(page, wbc);
|
|
mapping_set_error(mapping, ret);
|
|
return ret;
|
|
}
|
|
|
|
/**
|
|
* generic_writepages - walk the list of dirty pages of the given address space and writepage() all of them.
|
|
* @mapping: address space structure to write
|
|
* @wbc: subtract the number of written pages from *@wbc->nr_to_write
|
|
*
|
|
* This is a library function, which implements the writepages()
|
|
* address_space_operation.
|
|
*/
|
|
int generic_writepages(struct address_space *mapping,
|
|
struct writeback_control *wbc)
|
|
{
|
|
struct blk_plug plug;
|
|
int ret;
|
|
|
|
/* deal with chardevs and other special file */
|
|
if (!mapping->a_ops->writepage)
|
|
return 0;
|
|
|
|
blk_start_plug(&plug);
|
|
ret = write_cache_pages(mapping, wbc, __writepage, mapping);
|
|
blk_finish_plug(&plug);
|
|
return ret;
|
|
}
|
|
|
|
EXPORT_SYMBOL(generic_writepages);
|
|
|
|
int do_writepages(struct address_space *mapping, struct writeback_control *wbc)
|
|
{
|
|
int ret;
|
|
|
|
if (wbc->nr_to_write <= 0)
|
|
return 0;
|
|
while (1) {
|
|
if (mapping->a_ops->writepages)
|
|
ret = mapping->a_ops->writepages(mapping, wbc);
|
|
else
|
|
ret = generic_writepages(mapping, wbc);
|
|
if ((ret != -ENOMEM) || (wbc->sync_mode != WB_SYNC_ALL))
|
|
break;
|
|
cond_resched();
|
|
congestion_wait(BLK_RW_ASYNC, HZ/50);
|
|
}
|
|
return ret;
|
|
}
|
|
|
|
/**
|
|
* write_one_page - write out a single page and wait on I/O
|
|
* @page: the page to write
|
|
*
|
|
* The page must be locked by the caller and will be unlocked upon return.
|
|
*
|
|
* Note that the mapping's AS_EIO/AS_ENOSPC flags will be cleared when this
|
|
* function returns.
|
|
*/
|
|
int write_one_page(struct page *page)
|
|
{
|
|
struct address_space *mapping = page->mapping;
|
|
int ret = 0;
|
|
struct writeback_control wbc = {
|
|
.sync_mode = WB_SYNC_ALL,
|
|
.nr_to_write = 1,
|
|
};
|
|
|
|
BUG_ON(!PageLocked(page));
|
|
|
|
wait_on_page_writeback(page);
|
|
|
|
if (clear_page_dirty_for_io(page)) {
|
|
get_page(page);
|
|
ret = mapping->a_ops->writepage(page, &wbc);
|
|
if (ret == 0)
|
|
wait_on_page_writeback(page);
|
|
put_page(page);
|
|
} else {
|
|
unlock_page(page);
|
|
}
|
|
|
|
if (!ret)
|
|
ret = filemap_check_errors(mapping);
|
|
return ret;
|
|
}
|
|
EXPORT_SYMBOL(write_one_page);
|
|
|
|
/*
 * set_page_dirty variant for address_spaces which use neither buffers nor
 * writeback: only the page flag is touched.
 *
 * Returns 1 if this call set the dirty flag, 0 if the page was already
 * dirty.
 */
int __set_page_dirty_no_writeback(struct page *page)
{
	/* Cheap test first; skip the test-and-set when already dirty. */
	if (PageDirty(page))
		return 0;

	return !TestSetPageDirty(page);
}
|
|
|
|
/*
|
|
* Helper function for set_page_dirty family.
|
|
*
|
|
* Caller must hold lock_page_memcg().
|
|
*
|
|
* NOTE: This relies on being atomic wrt interrupts.
|
|
*/
|
|
void account_page_dirtied(struct page *page, struct address_space *mapping)
|
|
{
|
|
struct inode *inode = mapping->host;
|
|
|
|
trace_writeback_dirty_page(page, mapping);
|
|
|
|
if (mapping_cap_account_dirty(mapping)) {
|
|
struct bdi_writeback *wb;
|
|
|
|
inode_attach_wb(inode, page);
|
|
wb = inode_to_wb(inode);
|
|
|
|
__inc_lruvec_page_state(page, NR_FILE_DIRTY);
|
|
__inc_zone_page_state(page, NR_ZONE_WRITE_PENDING);
|
|
__inc_node_page_state(page, NR_DIRTIED);
|
|
inc_wb_stat(wb, WB_RECLAIMABLE);
|
|
inc_wb_stat(wb, WB_DIRTIED);
|
|
task_io_account_write(PAGE_SIZE);
|
|
current->nr_dirtied++;
|
|
this_cpu_inc(bdp_ratelimits);
|
|
}
|
|
}
|
|
EXPORT_SYMBOL(account_page_dirtied);
|
|
|
|
/*
|
|
* Helper function for deaccounting dirty page without writeback.
|
|
*
|
|
* Caller must hold lock_page_memcg().
|
|
*/
|
|
void account_page_cleaned(struct page *page, struct address_space *mapping,
|
|
struct bdi_writeback *wb)
|
|
{
|
|
if (mapping_cap_account_dirty(mapping)) {
|
|
dec_lruvec_page_state(page, NR_FILE_DIRTY);
|
|
dec_zone_page_state(page, NR_ZONE_WRITE_PENDING);
|
|
dec_wb_stat(wb, WB_RECLAIMABLE);
|
|
task_io_account_cancelled_write(PAGE_SIZE);
|
|
}
|
|
}
|
|
|
|
/*
|
|
* For address_spaces which do not use buffers. Just tag the page as dirty in
|
|
* its radix tree.
|
|
*
|
|
* This is also used when a single buffer is being dirtied: we want to set the
|
|
* page dirty in that case, but not all the buffers. This is a "bottom-up"
|
|
* dirtying, whereas __set_page_dirty_buffers() is a "top-down" dirtying.
|
|
*
|
|
* The caller must ensure this doesn't race with truncation. Most will simply
|
|
* hold the page lock, but e.g. zap_pte_range() calls with the page mapped and
|
|
* the pte lock held, which also locks out truncation.
|
|
*/
|
|
int __set_page_dirty_nobuffers(struct page *page)
|
|
{
|
|
lock_page_memcg(page);
|
|
if (!TestSetPageDirty(page)) {
|
|
struct address_space *mapping = page_mapping(page);
|
|
unsigned long flags;
|
|
|
|
if (!mapping) {
|
|
unlock_page_memcg(page);
|
|
return 1;
|
|
}
|
|
|
|
xa_lock_irqsave(&mapping->i_pages, flags);
|
|
BUG_ON(page_mapping(page) != mapping);
|
|
WARN_ON_ONCE(!PagePrivate(page) && !PageUptodate(page));
|
|
account_page_dirtied(page, mapping);
|
|
radix_tree_tag_set(&mapping->i_pages, page_index(page),
|
|
PAGECACHE_TAG_DIRTY);
|
|
xa_unlock_irqrestore(&mapping->i_pages, flags);
|
|
unlock_page_memcg(page);
|
|
|
|
if (mapping->host) {
|
|
/* !PageAnon && !swapper_space */
|
|
__mark_inode_dirty(mapping->host, I_DIRTY_PAGES);
|
|
}
|
|
return 1;
|
|
}
|
|
unlock_page_memcg(page);
|
|
return 0;
|
|
}
|
|
EXPORT_SYMBOL(__set_page_dirty_nobuffers);
|
|
|
|
/*
|
|
* Call this whenever redirtying a page, to de-account the dirty counters
|
|
* (NR_DIRTIED, WB_DIRTIED, tsk->nr_dirtied), so that they match the written
|
|
* counters (NR_WRITTEN, WB_WRITTEN) in long term. The mismatches will lead to
|
|
* systematic errors in balanced_dirty_ratelimit and the dirty pages position
|
|
* control.
|
|
*/
|
|
void account_page_redirty(struct page *page)
|
|
{
|
|
struct address_space *mapping = page->mapping;
|
|
|
|
if (mapping && mapping_cap_account_dirty(mapping)) {
|
|
struct inode *inode = mapping->host;
|
|
struct bdi_writeback *wb;
|
|
struct wb_lock_cookie cookie = {};
|
|
|
|
wb = unlocked_inode_to_wb_begin(inode, &cookie);
|
|
current->nr_dirtied--;
|
|
dec_node_page_state(page, NR_DIRTIED);
|
|
dec_wb_stat(wb, WB_DIRTIED);
|
|
unlocked_inode_to_wb_end(inode, &cookie);
|
|
}
|
|
}
|
|
EXPORT_SYMBOL(account_page_redirty);
|
|
|
|
/*
|
|
* When a writepage implementation decides that it doesn't want to write this
|
|
* page for some reason, it should redirty the locked page via
|
|
* redirty_page_for_writepage() and it should then unlock the page and return 0
|
|
*/
|
|
int redirty_page_for_writepage(struct writeback_control *wbc, struct page *page)
|
|
{
|
|
int ret;
|
|
|
|
wbc->pages_skipped++;
|
|
ret = __set_page_dirty_nobuffers(page);
|
|
account_page_redirty(page);
|
|
return ret;
|
|
}
|
|
EXPORT_SYMBOL(redirty_page_for_writepage);
|
|
|
|
/*
|
|
* Dirty a page.
|
|
*
|
|
* For pages with a mapping this should be done under the page lock
|
|
* for the benefit of asynchronous memory errors who prefer a consistent
|
|
* dirty state. This rule can be broken in some special cases,
|
|
* but should be better not to.
|
|
*
|
|
* If the mapping doesn't provide a set_page_dirty a_op, then
|
|
* just fall through and assume that it wants buffer_heads.
|
|
*/
|
|
int set_page_dirty(struct page *page)
|
|
{
|
|
struct address_space *mapping = page_mapping(page);
|
|
|
|
page = compound_head(page);
|
|
if (likely(mapping)) {
|
|
int (*spd)(struct page *) = mapping->a_ops->set_page_dirty;
|
|
/*
|
|
* readahead/lru_deactivate_page could remain
|
|
* PG_readahead/PG_reclaim due to race with end_page_writeback
|
|
* About readahead, if the page is written, the flags would be
|
|
* reset. So no problem.
|
|
* About lru_deactivate_page, if the page is redirty, the flag
|
|
* will be reset. So no problem. but if the page is used by readahead
|
|
* it will confuse readahead and make it restart the size rampup
|
|
* process. But it's a trivial problem.
|
|
*/
|
|
if (PageReclaim(page))
|
|
ClearPageReclaim(page);
|
|
#ifdef CONFIG_BLOCK
|
|
if (!spd)
|
|
spd = __set_page_dirty_buffers;
|
|
#endif
|
|
return (*spd)(page);
|
|
}
|
|
if (!PageDirty(page)) {
|
|
if (!TestSetPageDirty(page))
|
|
return 1;
|
|
}
|
|
return 0;
|
|
}
|
|
EXPORT_SYMBOL(set_page_dirty);
|
|
|
|
/*
 * set_page_dirty() is racy when the caller holds no reference against
 * page->mapping->host and the page is unlocked: another CPU could truncate
 * the page off the mapping and then free the mapping.
 *
 * Usually the page _is_ locked, or the caller is a user-space process that
 * holds a reference on the inode through an open file.
 *
 * In all other cases the page should be locked before set_page_dirty() is
 * run, which is what this wrapper does.  It returns set_page_dirty()'s
 * result.
 */
int set_page_dirty_lock(struct page *page)
{
	int dirtied;

	lock_page(page);
	dirtied = set_page_dirty(page);
	unlock_page(page);

	return dirtied;
}
|
|
EXPORT_SYMBOL(set_page_dirty_lock);
|
|
|
|
/*
|
|
* This cancels just the dirty bit on the kernel page itself, it does NOT
|
|
* actually remove dirty bits on any mmap's that may be around. It also
|
|
* leaves the page tagged dirty, so any sync activity will still find it on
|
|
* the dirty lists, and in particular, clear_page_dirty_for_io() will still
|
|
* look at the dirty bits in the VM.
|
|
*
|
|
* Doing this should *normally* only ever be done when a page is truncated,
|
|
* and is not actually mapped anywhere at all. However, fs/buffer.c does
|
|
* this when it notices that somebody has cleaned out all the buffers on a
|
|
* page without actually doing it through the VM. Can you say "ext3 is
|
|
* horribly ugly"? Thought you could.
|
|
*/
|
|
void __cancel_dirty_page(struct page *page)
|
|
{
|
|
struct address_space *mapping = page_mapping(page);
|
|
|
|
if (mapping_cap_account_dirty(mapping)) {
|
|
struct inode *inode = mapping->host;
|
|
struct bdi_writeback *wb;
|
|
struct wb_lock_cookie cookie = {};
|
|
|
|
lock_page_memcg(page);
|
|
wb = unlocked_inode_to_wb_begin(inode, &cookie);
|
|
|
|
if (TestClearPageDirty(page))
|
|
account_page_cleaned(page, mapping, wb);
|
|
|
|
unlocked_inode_to_wb_end(inode, &cookie);
|
|
unlock_page_memcg(page);
|
|
} else {
|
|
ClearPageDirty(page);
|
|
}
|
|
}
|
|
EXPORT_SYMBOL(__cancel_dirty_page);
|
|
|
|
/*
|
|
* Clear a page's dirty flag, while caring for dirty memory accounting.
|
|
* Returns true if the page was previously dirty.
|
|
*
|
|
* This is for preparing to put the page under writeout. We leave the page
|
|
* tagged as dirty in the radix tree so that a concurrent write-for-sync
|
|
* can discover it via a PAGECACHE_TAG_DIRTY walk. The ->writepage
|
|
* implementation will run either set_page_writeback() or set_page_dirty(),
|
|
* at which stage we bring the page's dirty flag and radix-tree dirty tag
|
|
* back into sync.
|
|
*
|
|
* This incoherency between the page's dirty flag and radix-tree tag is
|
|
* unfortunate, but it only exists while the page is locked.
|
|
*/
|
|
int clear_page_dirty_for_io(struct page *page)
|
|
{
|
|
struct address_space *mapping = page_mapping(page);
|
|
int ret = 0;
|
|
|
|
BUG_ON(!PageLocked(page));
|
|
|
|
if (mapping && mapping_cap_account_dirty(mapping)) {
|
|
struct inode *inode = mapping->host;
|
|
struct bdi_writeback *wb;
|
|
struct wb_lock_cookie cookie = {};
|
|
|
|
/*
|
|
* Yes, Virginia, this is indeed insane.
|
|
*
|
|
* We use this sequence to make sure that
|
|
* (a) we account for dirty stats properly
|
|
* (b) we tell the low-level filesystem to
|
|
* mark the whole page dirty if it was
|
|
* dirty in a pagetable. Only to then
|
|
* (c) clean the page again and return 1 to
|
|
* cause the writeback.
|
|
*
|
|
* This way we avoid all nasty races with the
|
|
* dirty bit in multiple places and clearing
|
|
* them concurrently from different threads.
|
|
*
|
|
* Note! Normally the "set_page_dirty(page)"
|
|
* has no effect on the actual dirty bit - since
|
|
* that will already usually be set. But we
|
|
* need the side effects, and it can help us
|
|
* avoid races.
|
|
*
|
|
* We basically use the page "master dirty bit"
|
|
* as a serialization point for all the different
|
|
* threads doing their things.
|
|
*/
|
|
if (page_mkclean(page))
|
|
set_page_dirty(page);
|
|
/*
|
|
* We carefully synchronise fault handlers against
|
|
* installing a dirty pte and marking the page dirty
|
|
* at this point. We do this by having them hold the
|
|
* page lock while dirtying the page, and pages are
|
|
* always locked coming in here, so we get the desired
|
|
* exclusion.
|
|
*/
|
|
wb = unlocked_inode_to_wb_begin(inode, &cookie);
|
|
if (TestClearPageDirty(page)) {
|
|
dec_lruvec_page_state(page, NR_FILE_DIRTY);
|
|
dec_zone_page_state(page, NR_ZONE_WRITE_PENDING);
|
|
dec_wb_stat(wb, WB_RECLAIMABLE);
|
|
ret = 1;
|
|
}
|
|
unlocked_inode_to_wb_end(inode, &cookie);
|
|
return ret;
|
|
}
|
|
return TestClearPageDirty(page);
|
|
}
|
|
EXPORT_SYMBOL(clear_page_dirty_for_io);
|
|
|
|
int test_clear_page_writeback(struct page *page)
|
|
{
|
|
struct address_space *mapping = page_mapping(page);
|
|
struct mem_cgroup *memcg;
|
|
struct lruvec *lruvec;
|
|
int ret;
|
|
|
|
memcg = lock_page_memcg(page);
|
|
lruvec = mem_cgroup_page_lruvec(page, page_pgdat(page));
|
|
if (mapping && mapping_use_writeback_tags(mapping)) {
|
|
struct inode *inode = mapping->host;
|
|
struct backing_dev_info *bdi = inode_to_bdi(inode);
|
|
unsigned long flags;
|
|
|
|
xa_lock_irqsave(&mapping->i_pages, flags);
|
|
ret = TestClearPageWriteback(page);
|
|
if (ret) {
|
|
radix_tree_tag_clear(&mapping->i_pages, page_index(page),
|
|
PAGECACHE_TAG_WRITEBACK);
|
|
if (bdi_cap_account_writeback(bdi)) {
|
|
struct bdi_writeback *wb = inode_to_wb(inode);
|
|
|
|
dec_wb_stat(wb, WB_WRITEBACK);
|
|
__wb_writeout_inc(wb);
|
|
}
|
|
}
|
|
|
|
if (mapping->host && !mapping_tagged(mapping,
|
|
PAGECACHE_TAG_WRITEBACK))
|
|
sb_clear_inode_writeback(mapping->host);
|
|
|
|
xa_unlock_irqrestore(&mapping->i_pages, flags);
|
|
} else {
|
|
ret = TestClearPageWriteback(page);
|
|
}
|
|
/*
|
|
* NOTE: Page might be free now! Writeback doesn't hold a page
|
|
* reference on its own, it relies on truncation to wait for
|
|
* the clearing of PG_writeback. The below can only access
|
|
* page state that is static across allocation cycles.
|
|
*/
|
|
if (ret) {
|
|
dec_lruvec_state(lruvec, NR_WRITEBACK);
|
|
dec_zone_page_state(page, NR_ZONE_WRITE_PENDING);
|
|
inc_node_page_state(page, NR_WRITTEN);
|
|
}
|
|
__unlock_page_memcg(memcg);
|
|
return ret;
|
|
}
|
|
|
|
/*
 * Set the page's writeback flag and keep the radix-tree tags and writeback
 * statistics consistent with it.  When @keep_write is false the TOWRITE tag
 * is cleared as well.  Returns the previous state of the flag as reported
 * by TestSetPageWriteback().
 */
int __test_set_page_writeback(struct page *page, bool keep_write)
{
	struct address_space *mapping = page_mapping(page);
	int ret;

	lock_page_memcg(page);

	if (!mapping || !mapping_use_writeback_tags(mapping)) {
		/* No writeback tags to maintain: flag only. */
		ret = TestSetPageWriteback(page);
	} else {
		struct inode *inode = mapping->host;
		struct backing_dev_info *bdi = inode_to_bdi(inode);
		unsigned long flags;

		xa_lock_irqsave(&mapping->i_pages, flags);

		ret = TestSetPageWriteback(page);
		if (!ret) {
			/* Sample the tag state before this page is tagged. */
			bool on_wblist = mapping_tagged(mapping,
						PAGECACHE_TAG_WRITEBACK);

			radix_tree_tag_set(&mapping->i_pages,
					   page_index(page),
					   PAGECACHE_TAG_WRITEBACK);
			if (bdi_cap_account_writeback(bdi))
				inc_wb_stat(inode_to_wb(inode), WB_WRITEBACK);

			/*
			 * This path is also taken when swapping anonymous
			 * pages, so there is not necessarily an inode to
			 * track for sync.
			 */
			if (mapping->host && !on_wblist)
				sb_mark_inode_writeback(mapping->host);
		}

		if (!PageDirty(page))
			radix_tree_tag_clear(&mapping->i_pages,
					     page_index(page),
					     PAGECACHE_TAG_DIRTY);
		if (!keep_write)
			radix_tree_tag_clear(&mapping->i_pages,
					     page_index(page),
					     PAGECACHE_TAG_TOWRITE);

		xa_unlock_irqrestore(&mapping->i_pages, flags);
	}

	if (!ret) {
		inc_lruvec_page_state(page, NR_WRITEBACK);
		inc_zone_page_state(page, NR_ZONE_WRITE_PENDING);
	}
	unlock_page_memcg(page);

	return ret;
}
|
|
EXPORT_SYMBOL(__test_set_page_writeback);
|
|
|
|
/*
|
|
* Return true if any of the pages in the mapping are marked with the
|
|
* passed tag.
|
|
*/
|
|
int mapping_tagged(struct address_space *mapping, int tag)
|
|
{
|
|
return radix_tree_tagged(&mapping->i_pages, tag);
|
|
}
|
|
EXPORT_SYMBOL(mapping_tagged);
|
|
|
|
/**
|
|
* wait_for_stable_page() - wait for writeback to finish, if necessary.
|
|
* @page: The page to wait on.
|
|
*
|
|
* This function determines if the given page is related to a backing device
|
|
* that requires page contents to be held stable during writeback. If so, then
|
|
* it will wait for any pending writeback to complete.
|
|
*/
|
|
void wait_for_stable_page(struct page *page)
|
|
{
|
|
if (bdi_cap_stable_pages_required(inode_to_bdi(page->mapping->host)))
|
|
wait_on_page_writeback(page);
|
|
}
|
|
EXPORT_SYMBOL_GPL(wait_for_stable_page);
|