From patchwork Thu Aug 1 12:58:45 2024
X-Patchwork-Submitter: Alice Ryhl
X-Patchwork-Id: 13750397
Date: Thu, 01 Aug 2024 12:58:45 +0000
X-Mailer: b4 0.13.0
Message-ID: <20240801-vma-v3-1-db6c1c0afda9@google.com>
Subject: [PATCH v3] rust: mm: add abstractions for mm_struct and vm_area_struct
From: Alice Ryhl
To: Miguel Ojeda, Andrew Morton
Cc: Alex Gaynor, Wedson Almeida Filho, Boqun Feng, Gary Guo, Björn Roy Baron,
    Benno Lossin, Andreas Hindborg, Matthew Wilcox,
Howlett" , Vlastimil Babka , Lorenzo Stoakes , linux-kernel@vger.kernel.org, linux-mm@kvack.org, rust-for-linux@vger.kernel.org, Alice Ryhl X-Rspamd-Server: rspam07 X-Rspamd-Queue-Id: 52C07A0031 X-Stat-Signature: seeb1mk6nf1d3gqnomhxyeqpjqbbhtg1 X-Rspam-User: X-HE-Tag: 1722517157-745447 X-HE-Meta: U2FsdGVkX1/aurjdlhwVbUD4GW1WPq7wxBJHuFJ5AY/6YHY7pez5t9WMSBL8B8VssB5Dq/FciRxzStPJ+IFh4FLBMuU4+yala62hDkmt0EjUXcrJGFlXLBCbB+afk1rJWy3dYhLpe6+udgNDCX5tPIweJzOrcZfCiK42a/KH+Gfqys0enuEpUlXHQVd3poakMjUBJUUZDiRcxEQkVRvPoTsnO9Cw+APNhBhimPMMpvY1hzHpvwbJa9gC8CvRaVJ9nia91BIVMnx7huE5LugjXnx4zATe3xbZzvAPN4XXnUGQSzpNbh4LIT29+tU890h3hdZJJW880/mVevqI4pNjKw64qrAVuAkI59zVuE78iYMTmm/3CoMv0Q5LSdug9J8wmPW3q3d4jnok6XP24EqwAF0QatfV4Aujt8f4sg3XKh698TMvahSGxLhmJxO2GvphVK5sXxLkCT1t9j/O3kDyxxT9I5dxALb/XP2lSjbaZcioZMFWPxwg/DBuWHfLLBAxFtCoKp76pJoO9HG9mh82h05igQHlwZCfztTj/0ogfPVNh0TTEQZM+eJXz+VuJ+6v9luv1CWn/bRb6IiWlHER0RJII+uIgZ/LZ739wPliZMqnzECxigMpD2z/ddMYHAHj6pRAsRkvlJ/wEXUAISGHqrXe/YqCwN7q4JSdk6pstVmKddN00rONa5nAUtl5YYHg/U8aO2FhWIiaXDqmu6enzGTSL69hZjD6q1rQqEeyiew1MYrY7Kog2gJn8HQwe/rV7Nuv1QYqCBIpXXJEvDPY9i5srwMHTuhjaYx8ZGD7j9sPaZ3MKcLRi5GaFPiiNsc5DSmIr+EGU6BpcmIrRtij7c4nBN55ctttVQxow3JeK3/s3fELt7pXzSNBeDGEv7QnE9kig4b2n6KlV3ioSvosB4O6/FquA/SHjK0hh9qypu1SEP7hIj6YGlkMcn/sxTEQjJKVRXtesx1YMOoUqBt P3jOYCDe 8PzQ5U3PvW/ep5LPV2dkKHzA4naNeN+w9Le3Q9yv81aZoF8KFp/GmFfiiymAwKEO6upgckM6ZcUfYYJCyvABCqBgqFp6SLGLZlAcgpVJF2XTyaKl1g89LDsM9AsUJQ8vH/WGZwNhKtwb3Dq4xAPJZKTnEJczLZbw62uLFUOc7V73S7hP96um7FEBclMjZGCppqvvHS33zPHOMzDFujO2gZsC51Py79QqFrYs0rOHl+Dd0VZSJcFto16oKGdYuZcG7laP0ELymPqdW3EQQNK3b4E3h1flYZHHeE0He+5hv5ghgsaDJtFAuPyp5mgAnWn3mK9FFwBjqeAQ6h6WqsG/9cH0KN2kfI2xijCCOMSN6O8hauh6SplOhAV6eOQYKi50uT2iADYW0eT3j1xahiarpX7fv1sYyQR/oZBCCVdNTmkBz31Kj0h8zVvKoBlGMq9asoSvie/yPS3kxjqIlLgamivc0l6x+uB1QEANiWa69bjR2rkXQhglWin7J6UO65gVMvU2JNYLpbZlI8sNIGqnlGXRgO1/lxGgzcU1hqLQ33EdaM/v3VuBBB+5Ww7H0Hq6qNqGYX1OmN84KxiDP41f42NpVOaIpfNgqILRw2atQEYNqgDXRXvu7u2+TRAknTci6nFMRck6154DDGqouVQXL3JbiNtUh6qfJjXtlOpCA+XE4DVHl/b7bbBTbgNxdD+9KVcID57WGWvMKYMnQlwgRzPJStO5oUVxnuJoA5whuaLF4jMWgVyTXvzVcQ8qDHdkPGTQM33XxxiuSl6U= X-Bogosity: Ham, tests=bogofilter, spamicity=0.000002, version=1.2.4 Sender: owner-linux-mm@kvack.org Precedence: bulk X-Loop: owner-majordomo@kvack.org List-ID: List-Subscribe: List-Unsubscribe: This is a follow-up to the page abstractions [1] that were recently merged in 6.11. Rust Binder will need these abstractions to manipulate the vma in its implementation of the mmap fop on the Binder file. This patch is based on Wedson's implementation on the old rust branch, but has been changed significantly. All mistakes are Alice's. Link: https://lore.kernel.org/r/20240528-alice-mm-v7-4-78222c31b8f4@google.com [1] Co-developed-by: Wedson Almeida Filho Signed-off-by: Wedson Almeida Filho Signed-off-by: Alice Ryhl --- Changes in v3: - Reorder entries in mm.rs. - Use ARef for mmput_async helper. - Clarify that VmArea requires you to hold the mmap read or write lock. 
- Link to v2: https://lore.kernel.org/r/20240727-vma-v2-1-ab3e5927dc3a@google.com

Changes in v2:
- mm.rs is redesigned from scratch making use of AsRef
- Add notes about whether destructors may sleep
- Rename Area to VmArea
- Link to v1: https://lore.kernel.org/r/20240723-vma-v1-1-32ad5a0118ee@google.com
---
 rust/helpers.c         |  61 +++++++++
 rust/kernel/lib.rs     |   1 +
 rust/kernel/mm.rs      | 337 +++++++++++++++++++++++++++++++++++++++++++++++++
 rust/kernel/mm/virt.rs | 204 ++++++++++++++++++++++++++++++
 rust/kernel/types.rs   |   9 ++
 5 files changed, 612 insertions(+)
---
base-commit: 8400291e289ee6b2bf9779ff1c83a291501f017b
change-id: 20240723-vma-f80119f9fb35

Best regards,

diff --git a/rust/helpers.c b/rust/helpers.c
index 92d3c03ae1bd..97300f34505f 100644
--- a/rust/helpers.c
+++ b/rust/helpers.c
@@ -200,6 +200,67 @@ rust_helper_krealloc(const void *objp, size_t new_size, gfp_t flags)
 }
 EXPORT_SYMBOL_GPL(rust_helper_krealloc);
 
+void rust_helper_mmgrab(struct mm_struct *mm)
+{
+	mmgrab(mm);
+}
+EXPORT_SYMBOL_GPL(rust_helper_mmgrab);
+
+void rust_helper_mmdrop(struct mm_struct *mm)
+{
+	mmdrop(mm);
+}
+EXPORT_SYMBOL_GPL(rust_helper_mmdrop);
+
+void rust_helper_mmget(struct mm_struct *mm)
+{
+	mmget(mm);
+}
+EXPORT_SYMBOL_GPL(rust_helper_mmget);
+
+bool rust_helper_mmget_not_zero(struct mm_struct *mm)
+{
+	return mmget_not_zero(mm);
+}
+EXPORT_SYMBOL_GPL(rust_helper_mmget_not_zero);
+
+void rust_helper_mmap_read_lock(struct mm_struct *mm)
+{
+	mmap_read_lock(mm);
+}
+EXPORT_SYMBOL_GPL(rust_helper_mmap_read_lock);
+
+bool rust_helper_mmap_read_trylock(struct mm_struct *mm)
+{
+	return mmap_read_trylock(mm);
+}
+EXPORT_SYMBOL_GPL(rust_helper_mmap_read_trylock);
+
+void rust_helper_mmap_read_unlock(struct mm_struct *mm)
+{
+	mmap_read_unlock(mm);
+}
+EXPORT_SYMBOL_GPL(rust_helper_mmap_read_unlock);
+
+void rust_helper_mmap_write_lock(struct mm_struct *mm)
+{
+	mmap_write_lock(mm);
+}
+EXPORT_SYMBOL_GPL(rust_helper_mmap_write_lock);
+
+void rust_helper_mmap_write_unlock(struct mm_struct *mm)
+{
+	mmap_write_unlock(mm);
+}
+EXPORT_SYMBOL_GPL(rust_helper_mmap_write_unlock);
+
+struct vm_area_struct *rust_helper_vma_lookup(struct mm_struct *mm,
+					      unsigned long addr)
+{
+	return vma_lookup(mm, addr);
+}
+EXPORT_SYMBOL_GPL(rust_helper_vma_lookup);
+
 /*
  * `bindgen` binds the C `size_t` type as the Rust `usize` type, so we can
  * use it in contexts where Rust expects a `usize` like slice (array) indices.
diff --git a/rust/kernel/lib.rs b/rust/kernel/lib.rs
index 274bdc1b0a82..6c8bac65845e 100644
--- a/rust/kernel/lib.rs
+++ b/rust/kernel/lib.rs
@@ -38,6 +38,7 @@
 pub mod ioctl;
 #[cfg(CONFIG_KUNIT)]
 pub mod kunit;
+pub mod mm;
 #[cfg(CONFIG_NET)]
 pub mod net;
 pub mod page;
diff --git a/rust/kernel/mm.rs b/rust/kernel/mm.rs
new file mode 100644
index 000000000000..ed2db893fb79
--- /dev/null
+++ b/rust/kernel/mm.rs
@@ -0,0 +1,337 @@
+// SPDX-License-Identifier: GPL-2.0
+
+// Copyright (C) 2024 Google LLC.
+
+//! Memory management.
+//!
+//! C header: [`include/linux/mm.h`](../../../../include/linux/mm.h)
+
+use crate::{
+    bindings,
+    types::{ARef, AlwaysRefCounted, Opaque},
+};
+
+use core::{
+    ops::Deref,
+    ptr::{self, NonNull},
+};
+
+pub mod virt;
+
+/// A wrapper for the kernel's `struct mm_struct`.
+///
+/// Since `mm_users` may be zero, the associated address space may not exist anymore. You must use
+/// [`mmget_not_zero`] before accessing the address space.
+///
+/// The `ARef` smart pointer holds an `mmgrab` refcount. Its destructor may sleep.
+///
+/// # Invariants
+///
+/// Values of this type are always refcounted.
+///
+/// [`mmget_not_zero`]: Mm::mmget_not_zero
+pub struct Mm {
+    mm: Opaque<bindings::mm_struct>,
+}
+
+// SAFETY: It is safe to call `mmdrop` on another thread than where `mmgrab` was called.
+unsafe impl Send for Mm {}
+// SAFETY: All methods on `Mm` can be called in parallel from several threads.
+unsafe impl Sync for Mm {}
+
+// SAFETY: By the type invariants, this type is always refcounted.
+unsafe impl AlwaysRefCounted for Mm {
+    fn inc_ref(&self) {
+        // SAFETY: The pointer is valid since self is a reference.
+        unsafe { bindings::mmgrab(self.as_raw()) };
+    }
+
+    unsafe fn dec_ref(obj: NonNull<Self>) {
+        // SAFETY: The caller is giving up their refcount.
+        unsafe { bindings::mmdrop(obj.cast().as_ptr()) };
+    }
+}
+
+/// A wrapper for the kernel's `struct mm_struct`.
+///
+/// This type is used only when `mm_users` is known to be non-zero at compile-time. It can be used
+/// to access the associated address space.
+///
+/// The `ARef` smart pointer holds an `mmget` refcount. Its destructor may sleep.
+///
+/// # Invariants
+///
+/// Values of this type are always refcounted. The value of `mm_users` is non-zero.
+#[repr(transparent)]
+pub struct MmWithUser {
+    mm: Mm,
+}
+
+// SAFETY: It is safe to call `mmput` on another thread than where `mmget` was called.
+unsafe impl Send for MmWithUser {}
+// SAFETY: All methods on `MmWithUser` can be called in parallel from several threads.
+unsafe impl Sync for MmWithUser {}
+
+// SAFETY: By the type invariants, this type is always refcounted.
+unsafe impl AlwaysRefCounted for MmWithUser {
+    fn inc_ref(&self) {
+        // SAFETY: The pointer is valid since self is a reference.
+        unsafe { bindings::mmget(self.as_raw()) };
+    }
+
+    unsafe fn dec_ref(obj: NonNull<Self>) {
+        // SAFETY: The caller is giving up their refcount.
+        unsafe { bindings::mmput(obj.cast().as_ptr()) };
+    }
+}
+
+// Make all `Mm` methods available on `MmWithUser`.
+impl Deref for MmWithUser {
+    type Target = Mm;
+
+    #[inline]
+    fn deref(&self) -> &Mm {
+        &self.mm
+    }
+}
+
+/// A wrapper for the kernel's `struct mm_struct`.
+///
+/// This type is identical to `MmWithUser` except that it uses `mmput_async` when dropping a
+/// refcount. This means that the destructor of `ARef` is safe to call in atomic
+/// context.
+#[repr(transparent)]
+pub struct MmWithUserAsync {
+    mm: MmWithUser,
+}
+
+// SAFETY: It is safe to call `mmput_async` on another thread than where `mmget` was called.
+unsafe impl Send for MmWithUserAsync {}
+// SAFETY: All methods on `MmWithUserAsync` can be called in parallel from several threads.
+unsafe impl Sync for MmWithUserAsync {}
+
+// SAFETY: By the type invariants, this type is always refcounted.
+unsafe impl AlwaysRefCounted for MmWithUserAsync {
+    fn inc_ref(&self) {
+        // SAFETY: The pointer is valid since self is a reference.
+        unsafe { bindings::mmget(self.as_raw()) };
+    }
+
+    unsafe fn dec_ref(obj: NonNull<Self>) {
+        // SAFETY: The caller is giving up their refcount.
+        unsafe { bindings::mmput_async(obj.cast().as_ptr()) };
+    }
+}
+
+// Make all `MmWithUser` methods available on `MmWithUserAsync`.
+impl Deref for MmWithUserAsync {
+    type Target = MmWithUser;
+
+    #[inline]
+    fn deref(&self) -> &MmWithUser {
+        &self.mm
+    }
+}
+
+// These methods are safe to call even if `mm_users` is zero.
+impl Mm {
+    /// Call `mmgrab` on `current.mm`.
+    #[inline]
+    pub fn mmgrab_current() -> Option<ARef<Mm>> {
+        // SAFETY: It's safe to get the `mm` field from current.
+        let mm = unsafe {
+            let current = bindings::get_current();
+            (*current).mm
+        };
+
+        let mm = NonNull::new(mm)?;
+
+        // SAFETY: We just checked that `mm` is not null.
+        unsafe { bindings::mmgrab(mm.as_ptr()) };
+
+        // SAFETY: We just created an `mmgrab` refcount. Layouts are compatible due to
+        // repr(transparent).
+        Some(unsafe { ARef::from_raw(mm.cast()) })
+    }
+
+    /// Returns a raw pointer to the inner `mm_struct`.
+    #[inline]
+    pub fn as_raw(&self) -> *mut bindings::mm_struct {
+        self.mm.get()
+    }
+
+    /// Obtain a reference from a raw pointer.
+    ///
+    /// # Safety
+    ///
+    /// The caller must ensure that `ptr` points at an `mm_struct`, and that it is not deallocated
+    /// during the lifetime 'a.
+    #[inline]
+    pub unsafe fn from_raw_mm<'a>(ptr: *const bindings::mm_struct) -> &'a Mm {
+        // SAFETY: Caller promises that the pointer is valid for 'a. Layouts are compatible due to
+        // repr(transparent).
+        unsafe { &*ptr.cast() }
+    }
+
+    /// Check whether this vma is associated with this mm.
+    #[inline]
+    pub fn is_same_mm(&self, area: &virt::VmArea) -> bool {
+        // SAFETY: The `vm_mm` field of the area is immutable, so we can read it without
+        // synchronization.
+        let vm_mm = unsafe { (*area.as_ptr()).vm_mm };
+
+        ptr::eq(vm_mm, self.as_raw())
+    }
+
+    /// Calls `mmget_not_zero` and returns a handle if it succeeds.
+    #[inline]
+    pub fn mmget_not_zero(&self) -> Option<ARef<MmWithUser>> {
+        // SAFETY: The pointer is valid since self is a reference.
+        let success = unsafe { bindings::mmget_not_zero(self.as_raw()) };
+
+        if success {
+            // SAFETY: We just created an `mmget` refcount.
+            Some(unsafe { ARef::from_raw(NonNull::new_unchecked(self.as_raw().cast())) })
+        } else {
+            None
+        }
+    }
+}
+
+// These methods require `mm_users` to be non-zero.
+impl MmWithUser {
+    /// Obtain a reference from a raw pointer.
+    ///
+    /// # Safety
+    ///
+    /// The caller must ensure that `ptr` points at an `mm_struct`, and that `mm_users` remains
+    /// non-zero for the duration of the lifetime 'a.
+    #[inline]
+    pub unsafe fn from_raw_mm<'a>(ptr: *const bindings::mm_struct) -> &'a MmWithUser {
+        // SAFETY: Caller promises that the pointer is valid for 'a. The layout is compatible due
+        // to repr(transparent).
+        unsafe { &*ptr.cast() }
+    }
+
+    /// Use `mmput_async` when dropping this refcount.
+    pub fn use_mmput_async(me: ARef<MmWithUser>) -> ARef<MmWithUserAsync> {
+        // SAFETY: The layouts and invariants are compatible.
+        unsafe { ARef::from_raw(ARef::into_raw(me).cast()) }
+    }
+
+    /// Lock the mmap write lock.
+    #[inline]
+    pub fn mmap_write_lock(&self) -> MmapWriteLock<'_> {
+        // SAFETY: The pointer is valid since self is a reference.
+        unsafe { bindings::mmap_write_lock(self.as_raw()) };
+
+        // INVARIANT: We just acquired the write lock.
+        MmapWriteLock { mm: self }
+    }
+
+    /// Lock the mmap read lock.
+    #[inline]
+    pub fn mmap_read_lock(&self) -> MmapReadLock<'_> {
+        // SAFETY: The pointer is valid since self is a reference.
+        unsafe { bindings::mmap_read_lock(self.as_raw()) };
+
+        // INVARIANT: We just acquired the read lock.
+        MmapReadLock { mm: self }
+    }
+
+    /// Try to lock the mmap read lock.
+    #[inline]
+    pub fn mmap_read_trylock(&self) -> Option<MmapReadLock<'_>> {
+        // SAFETY: The pointer is valid since self is a reference.
+        let success = unsafe { bindings::mmap_read_trylock(self.as_raw()) };
+
+        if success {
+            // INVARIANT: We just acquired the read lock.
+            Some(MmapReadLock { mm: self })
+        } else {
+            None
+        }
+    }
+}
+
+impl MmWithUserAsync {
+    /// Use `mmput` when dropping this refcount.
+    pub fn use_mmput(me: ARef<MmWithUserAsync>) -> ARef<MmWithUser> {
+        // SAFETY: The layouts and invariants are compatible.
+        unsafe { ARef::from_raw(ARef::into_raw(me).cast()) }
+    }
+}
+
+/// A guard for the mmap read lock.
+///
+/// # Invariants
+///
+/// This `MmapReadLock` guard owns the mmap read lock.
+pub struct MmapReadLock<'a> {
+    mm: &'a MmWithUser,
+}
+
+impl<'a> MmapReadLock<'a> {
+    /// Look up a vma at the given address.
+    #[inline]
+    pub fn vma_lookup(&self, vma_addr: usize) -> Option<&virt::VmArea> {
+        // SAFETY: We hold a reference to the mm, so the pointer must be valid. Any value is okay
+        // for `vma_addr`.
+        let vma = unsafe { bindings::vma_lookup(self.mm.as_raw(), vma_addr as _) };
+
+        if vma.is_null() {
+            None
+        } else {
+            // SAFETY: We just checked that a vma was found, so the pointer is valid. Furthermore,
+            // the returned area will borrow from this read lock guard, so it can only be used
+            // while the read lock is still held. The returned reference is immutable, so the
+            // reference cannot be used to modify the area.
+            unsafe { Some(virt::VmArea::from_raw_vma(vma)) }
+        }
+    }
+}
+
+impl Drop for MmapReadLock<'_> {
+    #[inline]
+    fn drop(&mut self) {
+        // SAFETY: We hold the read lock by the type invariants.
+        unsafe { bindings::mmap_read_unlock(self.mm.as_raw()) };
+    }
+}
+
+/// A guard for the mmap write lock.
+///
+/// # Invariants
+///
+/// This `MmapWriteLock` guard owns the mmap write lock.
+pub struct MmapWriteLock<'a> {
+    mm: &'a MmWithUser,
+}
+
+impl<'a> MmapWriteLock<'a> {
+    /// Look up a vma at the given address.
+    #[inline]
+    pub fn vma_lookup(&mut self, vma_addr: usize) -> Option<&mut virt::VmArea> {
+        // SAFETY: We hold a reference to the mm, so the pointer must be valid. Any value is okay
+        // for `vma_addr`.
+        let vma = unsafe { bindings::vma_lookup(self.mm.as_raw(), vma_addr as _) };
+
+        if vma.is_null() {
+            None
+        } else {
+            // SAFETY: We just checked that a vma was found, so the pointer is valid. Furthermore,
+            // the returned area will borrow from this write lock guard, so it can only be used
+            // while the write lock is still held. We hold the write lock, so mutable operations on
+            // the area are okay.
+            unsafe { Some(virt::VmArea::from_raw_vma_mut(vma)) }
+        }
+    }
+}
+
+impl Drop for MmapWriteLock<'_> {
+    #[inline]
+    fn drop(&mut self) {
+        // SAFETY: We hold the write lock by the type invariants.
+        unsafe { bindings::mmap_write_unlock(self.mm.as_raw()) };
+    }
+}
diff --git a/rust/kernel/mm/virt.rs b/rust/kernel/mm/virt.rs
new file mode 100644
index 000000000000..ec8cadb09626
--- /dev/null
+++ b/rust/kernel/mm/virt.rs
@@ -0,0 +1,204 @@
+// SPDX-License-Identifier: GPL-2.0
+
+// Copyright (C) 2024 Google LLC.
+
+//! Virtual memory.
+
+use crate::{
+    bindings,
+    error::{to_result, Result},
+    page::Page,
+    types::Opaque,
+};
+
+/// A wrapper for the kernel's `struct vm_area_struct`.
+///
+/// It represents an area of virtual memory.
+///
+/// # Invariants
+///
+/// * If the caller has shared access to this type, then they must hold the mmap read lock.
+/// * If the caller has exclusive access to this type, then they must hold the mmap write lock.
+#[repr(transparent)]
+pub struct VmArea {
+    vma: Opaque<bindings::vm_area_struct>,
+}
+
+impl VmArea {
+    /// Access a virtual memory area given a raw pointer.
+    ///
+    /// # Safety
+    ///
+    /// Callers must ensure that `vma` is valid for the duration of 'a, and that the mmap read lock
+    /// (or write lock) is held for at least the duration of 'a.
+    #[inline]
+    pub unsafe fn from_raw_vma<'a>(vma: *const bindings::vm_area_struct) -> &'a Self {
+        // SAFETY: The caller ensures that the invariants are satisfied for the duration of 'a.
+        unsafe { &*vma.cast() }
+    }
+
+    /// Access a virtual memory area given a raw pointer.
+    ///
+    /// # Safety
+    ///
+    /// Callers must ensure that `vma` is valid for the duration of 'a, and that the mmap write
+    /// lock is held for at least the duration of 'a.
+    #[inline]
+    pub unsafe fn from_raw_vma_mut<'a>(vma: *mut bindings::vm_area_struct) -> &'a mut Self {
+        // SAFETY: The caller ensures that the invariants are satisfied for the duration of 'a.
+        unsafe { &mut *vma.cast() }
+    }
+
+    /// Returns a raw pointer to this area.
+    #[inline]
+    pub fn as_ptr(&self) -> *mut bindings::vm_area_struct {
+        self.vma.get()
+    }
+
+    /// Returns the flags associated with the virtual memory area.
+    ///
+    /// The possible flags are a combination of the constants in [`flags`].
+    #[inline]
+    pub fn flags(&self) -> usize {
+        // SAFETY: By the type invariants, the caller holds at least the mmap read lock, so this
+        // access is not a data race.
+        unsafe { (*self.as_ptr()).__bindgen_anon_2.vm_flags as _ }
+    }
+
+    /// Sets the flags associated with the virtual memory area.
+    ///
+    /// The possible flags are a combination of the constants in [`flags`].
+    #[inline]
+    pub fn set_flags(&mut self, flags: usize) {
+        // SAFETY: By the type invariants, the caller holds the mmap write lock, so this access is
+        // not a data race.
+        unsafe { (*self.as_ptr()).__bindgen_anon_2.vm_flags = flags as _ };
+    }
+
+    /// Returns the start address of the virtual memory area.
+    #[inline]
+    pub fn start(&self) -> usize {
+        // SAFETY: By the type invariants, the caller holds at least the mmap read lock, so this
+        // access is not a data race.
+        unsafe { (*self.as_ptr()).__bindgen_anon_1.__bindgen_anon_1.vm_start as _ }
+    }
+
+    /// Returns the end address of the virtual memory area.
+    #[inline]
+    pub fn end(&self) -> usize {
+        // SAFETY: By the type invariants, the caller holds at least the mmap read lock, so this
+        // access is not a data race.
+        unsafe { (*self.as_ptr()).__bindgen_anon_1.__bindgen_anon_1.vm_end as _ }
+    }
+
+    /// Make this vma anonymous.
+    #[inline]
+    pub fn set_anonymous(&mut self) {
+        // SAFETY: By the type invariants, the caller holds the mmap write lock, so this access is
+        // not a data race.
+        unsafe { (*self.as_ptr()).vm_ops = core::ptr::null() };
+    }
+
+    /// Maps a single page at the given address within the virtual memory area.
+    ///
+    /// This operation does not take ownership of the page.
+    #[inline]
+    pub fn vm_insert_page(&mut self, address: usize, page: &Page) -> Result {
+        // SAFETY: By the type invariants, the caller holds the mmap write lock, so this access is
+        // not a data race. The page is guaranteed to be valid and of order 0. The range of
+        // `address` is already checked by `vm_insert_page`.
+        to_result(unsafe { bindings::vm_insert_page(self.as_ptr(), address as _, page.as_ptr()) })
+    }
+
+    /// Unmap pages in the given page range.
+    #[inline]
+    pub fn zap_page_range_single(&self, address: usize, size: usize) {
+        // SAFETY: By the type invariants, the caller holds at least the mmap read lock, so this
+        // access is okay. Any value of `address` and `size` is allowed.
+        unsafe {
+            bindings::zap_page_range_single(
+                self.as_ptr(),
+                address as _,
+                size as _,
+                core::ptr::null_mut(),
+            )
+        };
+    }
+}
+
+/// Container for [`VmArea`] flags.
+pub mod flags {
+    use crate::bindings;
+
+    /// No flags are set.
+    pub const NONE: usize = bindings::VM_NONE as _;
+
+    /// Mapping allows reads.
+    pub const READ: usize = bindings::VM_READ as _;
+
+    /// Mapping allows writes.
+    pub const WRITE: usize = bindings::VM_WRITE as _;
+
+    /// Mapping allows execution.
+    pub const EXEC: usize = bindings::VM_EXEC as _;
+
+    /// Mapping is shared.
+    pub const SHARED: usize = bindings::VM_SHARED as _;
+
+    /// Mapping may be updated to allow reads.
+    pub const MAYREAD: usize = bindings::VM_MAYREAD as _;
+
+    /// Mapping may be updated to allow writes.
+    pub const MAYWRITE: usize = bindings::VM_MAYWRITE as _;
+
+    /// Mapping may be updated to allow execution.
+    pub const MAYEXEC: usize = bindings::VM_MAYEXEC as _;
+
+    /// Mapping may be updated to be shared.
+    pub const MAYSHARE: usize = bindings::VM_MAYSHARE as _;
+
+    /// Do not copy this vma on fork.
+    pub const DONTCOPY: usize = bindings::VM_DONTCOPY as _;
+
+    /// Cannot expand with mremap().
+    pub const DONTEXPAND: usize = bindings::VM_DONTEXPAND as _;
+
+    /// Lock the pages covered when they are faulted in.
+    pub const LOCKONFAULT: usize = bindings::VM_LOCKONFAULT as _;
+
+    /// Is a VM accounted object.
+    pub const ACCOUNT: usize = bindings::VM_ACCOUNT as _;
+
+    /// Should the VM suppress accounting.
+    pub const NORESERVE: usize = bindings::VM_NORESERVE as _;
+
+    /// Huge TLB Page VM.
+    pub const HUGETLB: usize = bindings::VM_HUGETLB as _;
+
+    /// Synchronous page faults.
+    pub const SYNC: usize = bindings::VM_SYNC as _;
+
+    /// Architecture-specific flag.
+    pub const ARCH_1: usize = bindings::VM_ARCH_1 as _;
+
+    /// Wipe VMA contents in child.
+    pub const WIPEONFORK: usize = bindings::VM_WIPEONFORK as _;
+
+    /// Do not include in the core dump.
+    pub const DONTDUMP: usize = bindings::VM_DONTDUMP as _;
+
+    /// Not soft dirty clean area.
+    pub const SOFTDIRTY: usize = bindings::VM_SOFTDIRTY as _;
+
+    /// Can contain "struct page" and pure PFN pages.
+    pub const MIXEDMAP: usize = bindings::VM_MIXEDMAP as _;
+
+    /// MADV_HUGEPAGE marked this vma.
+    pub const HUGEPAGE: usize = bindings::VM_HUGEPAGE as _;
+
+    /// MADV_NOHUGEPAGE marked this vma.
+    pub const NOHUGEPAGE: usize = bindings::VM_NOHUGEPAGE as _;
+
+    /// KSM may merge identical pages.
+    pub const MERGEABLE: usize = bindings::VM_MERGEABLE as _;
+}
diff --git a/rust/kernel/types.rs b/rust/kernel/types.rs
index bd189d646adb..143a2bf06941 100644
--- a/rust/kernel/types.rs
+++ b/rust/kernel/types.rs
@@ -366,6 +366,15 @@ pub unsafe fn from_raw(ptr: NonNull<T>) -> Self {
             _p: PhantomData,
         }
     }
+
+    /// Pass ownership of the refcount to a raw pointer.
+    pub fn into_raw(self) -> NonNull<T> {
+        let ptr = self.ptr;
+        // Skip the destructor.
+        core::mem::forget(self);
+
+        ptr
+    }
 }
 
 impl<T: AlwaysRefCounted> Clone for ARef<T> {
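
For reviewers unfamiliar with the API surface, here is a minimal usage sketch
(not part of the patch) of how a driver might tie these pieces together, in
the spirit of the Binder mmap use case mentioned in the commit message. The
function names `setup_vma` and `probe_address` are made up for illustration,
and the sketch assumes the `Page` type from the page abstractions in [1] plus
the error codes re-exported by `kernel::prelude`:

// Illustration only; not part of this patch.
use kernel::mm::{virt, Mm};
use kernel::page::Page;
use kernel::prelude::*;
use kernel::types::ARef;

/// Hypothetical mmap-time setup: map a single page into a vma to which the
/// caller has exclusive access (i.e. the mmap write lock is held).
fn setup_vma(vma: &mut virt::VmArea, page: &Page) -> Result {
    // Refuse writable mappings, similar to what Binder does.
    if vma.flags() & virt::flags::WRITE != 0 {
        return Err(EPERM);
    }

    // The mapping should not be copied on fork, and `vm_insert_page` expects
    // a MIXEDMAP-style vma, so adjust the flags and drop the vm_ops.
    vma.set_flags(vma.flags() | virt::flags::DONTCOPY | virt::flags::MIXEDMAP);
    vma.set_anonymous();

    // Map the page at the start of the area; the page's refcount is not
    // consumed by this call.
    vma.vm_insert_page(vma.start(), page)
}

/// Hypothetical lookup: given a stashed `ARef<Mm>`, report whether `addr`
/// currently falls inside some vma of that address space.
fn probe_address(mm: &ARef<Mm>, addr: usize) -> bool {
    // The address space may already have been torn down; `mmget_not_zero`
    // upgrades to an `ARef<MmWithUser>` only if `mm_users` is non-zero.
    let Some(mm) = mm.mmget_not_zero() else {
        return false;
    };

    // The read lock is enough to inspect vmas (but not modify them). It is
    // released when `guard` goes out of scope, and the `mmget` refcount when
    // `mm` is dropped (which may sleep, as the doc comments note).
    let guard = mm.mmap_read_lock();
    match guard.vma_lookup(addr) {
        Some(vma) => addr >= vma.start() && addr < vma.end(),
        None => false,
    }
}

The split between `Mm` and `MmWithUser` mirrors the C distinction between
`mmgrab`/`mmdrop` and `mmget`/`mmput`, which is why the sketch has to upgrade
the grab-reference before it may touch any vmas.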