-
Notifications
You must be signed in to change notification settings - Fork 1.2k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Enforce extension validity at parse time (#5888)
This PR adds a `DistExtension` field to some of our distribution types, which requires that we validate that the file type is known and supported when parsing (rather than when attempting to unzip). It removes a bunch of extension parsing from the code too, in favor of doing it once upfront. Closes #5858.
- Loading branch information
1 parent
66b6d7a
commit ec5c1f6
Showing
36 changed files
with
805 additions
and
482 deletions.
There are no files selected for viewing
Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.
Oops, something went wrong.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,99 @@ | ||
use std::fmt::{Display, Formatter}; | ||
use std::path::Path; | ||
|
||
use serde::{Deserialize, Serialize}; | ||
use thiserror::Error; | ||
|
||
#[derive(Clone, Copy, Debug, PartialEq, Eq, PartialOrd, Ord, Hash)] | ||
pub enum DistExtension { | ||
Wheel, | ||
Source(SourceDistExtension), | ||
} | ||
|
||
#[derive( | ||
Clone, | ||
Copy, | ||
Debug, | ||
PartialEq, | ||
Eq, | ||
PartialOrd, | ||
Ord, | ||
Hash, | ||
Serialize, | ||
Deserialize, | ||
rkyv::Archive, | ||
rkyv::Deserialize, | ||
rkyv::Serialize, | ||
)] | ||
#[archive(check_bytes)] | ||
#[archive_attr(derive(Debug))] | ||
pub enum SourceDistExtension { | ||
Zip, | ||
TarGz, | ||
TarBz2, | ||
TarXz, | ||
TarZst, | ||
} | ||
|
||
impl DistExtension { | ||
/// Extract the [`DistExtension`] from a path. | ||
pub fn from_path(path: impl AsRef<Path>) -> Result<Self, ExtensionError> { | ||
let Some(extension) = path.as_ref().extension().and_then(|ext| ext.to_str()) else { | ||
return Err(ExtensionError::Dist); | ||
}; | ||
|
||
match extension { | ||
"whl" => Ok(Self::Wheel), | ||
_ => SourceDistExtension::from_path(path) | ||
.map(Self::Source) | ||
.map_err(|_| ExtensionError::Dist), | ||
} | ||
} | ||
} | ||
|
||
impl SourceDistExtension { | ||
/// Extract the [`SourceDistExtension`] from a path. | ||
pub fn from_path(path: impl AsRef<Path>) -> Result<Self, ExtensionError> { | ||
/// Returns true if the path is a tar file (e.g., `.tar.gz`). | ||
fn is_tar(path: &Path) -> bool { | ||
path.file_stem().is_some_and(|stem| { | ||
Path::new(stem) | ||
.extension() | ||
.is_some_and(|ext| ext.eq_ignore_ascii_case("tar")) | ||
}) | ||
} | ||
|
||
let Some(extension) = path.as_ref().extension().and_then(|ext| ext.to_str()) else { | ||
return Err(ExtensionError::SourceDist); | ||
}; | ||
|
||
match extension { | ||
"zip" => Ok(Self::Zip), | ||
"gz" if is_tar(path.as_ref()) => Ok(Self::TarGz), | ||
"bz2" if is_tar(path.as_ref()) => Ok(Self::TarBz2), | ||
"xz" if is_tar(path.as_ref()) => Ok(Self::TarXz), | ||
"zst" if is_tar(path.as_ref()) => Ok(Self::TarZst), | ||
_ => Err(ExtensionError::SourceDist), | ||
} | ||
} | ||
} | ||
|
||
impl Display for SourceDistExtension { | ||
fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result { | ||
match self { | ||
Self::Zip => f.write_str("zip"), | ||
Self::TarGz => f.write_str("tar.gz"), | ||
Self::TarBz2 => f.write_str("tar.bz2"), | ||
Self::TarXz => f.write_str("tar.xz"), | ||
Self::TarZst => f.write_str("tar.zst"), | ||
} | ||
} | ||
} | ||
|
||
#[derive(Error, Debug)] | ||
pub enum ExtensionError { | ||
#[error("`.whl`, `.zip`, `.tar.gz`, `.tar.bz2`, `.tar.xz`, or `.tar.zst`")] | ||
Dist, | ||
#[error("`.zip`, `.tar.gz`, `.tar.bz2`, `.tar.xz`, or `.tar.zst`")] | ||
SourceDist, | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.