2020-06-15 11:29:07 +00:00
|
|
|
|
//! Partitions a list of files into disjoint subsets.
|
|
|
|
|
//!
|
|
|
|
|
//! Files which do not belong to any explicitly configured `FileSet` belong to
|
|
|
|
|
//! the default `FileSet`.
|
2020-07-07 20:53:12 +00:00
|
|
|
|
use std::fmt;
|
2020-06-15 11:29:07 +00:00
|
|
|
|
|
2020-07-07 20:53:12 +00:00
|
|
|
|
use fst::{IntoStreamer, Streamer};
|
2020-06-15 11:29:07 +00:00
|
|
|
|
use rustc_hash::FxHashMap;
|
|
|
|
|
|
|
|
|
|
use crate::{FileId, Vfs, VfsPath};
|
|
|
|
|
|
|
|
|
|
#[derive(Default, Clone, Eq, PartialEq)]
|
|
|
|
|
pub struct FileSet {
|
|
|
|
|
files: FxHashMap<VfsPath, FileId>,
|
|
|
|
|
paths: FxHashMap<FileId, VfsPath>,
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
impl FileSet {
|
2020-07-07 15:38:02 +00:00
|
|
|
|
pub fn len(&self) -> usize {
|
|
|
|
|
self.files.len()
|
|
|
|
|
}
|
2020-06-15 11:29:07 +00:00
|
|
|
|
pub fn resolve_path(&self, anchor: FileId, path: &str) -> Option<FileId> {
|
2020-09-03 22:32:06 +00:00
|
|
|
|
let mut base = self.paths[&anchor].clone();
|
2020-06-15 11:29:07 +00:00
|
|
|
|
base.pop();
|
2020-09-03 22:32:06 +00:00
|
|
|
|
let path = base.join(path)?;
|
2020-08-28 18:28:30 +00:00
|
|
|
|
self.files.get(&path).copied()
|
|
|
|
|
}
|
2020-09-03 20:18:23 +00:00
|
|
|
|
|
2020-09-05 22:41:18 +00:00
|
|
|
|
pub fn possible_sudmobule_names(&self, module_file: FileId) -> Vec<String> {
|
|
|
|
|
let directory_to_look_for_submodules = match self.get_directory_with_submodules(module_file)
|
|
|
|
|
{
|
|
|
|
|
Some(directory) => directory,
|
|
|
|
|
None => return Vec::new(),
|
2020-09-04 10:33:07 +00:00
|
|
|
|
};
|
2020-09-05 22:41:18 +00:00
|
|
|
|
self.paths
|
|
|
|
|
.iter()
|
|
|
|
|
.filter_map(|(_, path)| {
|
|
|
|
|
if path.parent()? == directory_to_look_for_submodules {
|
|
|
|
|
path.file_name_and_extension()
|
|
|
|
|
} else {
|
|
|
|
|
None
|
|
|
|
|
}
|
|
|
|
|
})
|
|
|
|
|
.filter_map(|file_name_and_extension| match file_name_and_extension {
|
|
|
|
|
// TODO kb do not include the module file name itself, if present
|
|
|
|
|
// TODO kb wrong resolution for nesСпаted non-file modules (mod tests {mod <|>)
|
|
|
|
|
// TODO kb in src/bin when a module is included into another,
|
|
|
|
|
// the included file gets "moved" into a directory below and now cannot add any other modules
|
|
|
|
|
("mod", Some("rs")) | ("lib", Some("rs")) | ("main", Some("rs")) => None,
|
|
|
|
|
(file_name, Some("rs")) => Some(file_name.to_owned()),
|
|
|
|
|
(subdirectory_name, None) => {
|
|
|
|
|
let mod_rs_path =
|
|
|
|
|
directory_to_look_for_submodules.join(subdirectory_name)?.join("mod.rs")?;
|
|
|
|
|
if self.files.contains_key(&mod_rs_path) {
|
|
|
|
|
Some(subdirectory_name.to_owned())
|
2020-09-03 23:25:00 +00:00
|
|
|
|
} else {
|
|
|
|
|
None
|
|
|
|
|
}
|
2020-09-05 22:41:18 +00:00
|
|
|
|
}
|
|
|
|
|
_ => None,
|
|
|
|
|
})
|
|
|
|
|
.collect()
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
fn get_directory_with_submodules(&self, module_file: FileId) -> Option<VfsPath> {
|
|
|
|
|
let module_file_path = &self.paths[&module_file];
|
|
|
|
|
let module_directory_path = module_file_path.parent()?;
|
|
|
|
|
match module_file_path.file_name_and_extension() {
|
|
|
|
|
Some(("mod", Some("rs"))) | Some(("lib", Some("rs"))) | Some(("main", Some("rs"))) => {
|
|
|
|
|
Some(module_directory_path)
|
|
|
|
|
}
|
|
|
|
|
Some((regular_rust_file_name, Some("rs"))) => {
|
|
|
|
|
if matches!(
|
|
|
|
|
(
|
|
|
|
|
module_directory_path
|
|
|
|
|
.parent()
|
|
|
|
|
.as_ref()
|
|
|
|
|
.and_then(|path| path.file_name_and_extension()),
|
|
|
|
|
module_directory_path.file_name_and_extension(),
|
|
|
|
|
),
|
|
|
|
|
(Some(("src", None)), Some(("bin", None)))
|
|
|
|
|
) {
|
|
|
|
|
// files in /src/bin/ can import each other directly
|
|
|
|
|
Some(module_directory_path)
|
|
|
|
|
} else {
|
|
|
|
|
module_directory_path.join(regular_rust_file_name)
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
_ => None,
|
2020-09-04 10:33:07 +00:00
|
|
|
|
}
|
2020-06-15 11:29:07 +00:00
|
|
|
|
}
|
2020-09-05 22:41:18 +00:00
|
|
|
|
|
2020-06-15 11:29:07 +00:00
|
|
|
|
pub fn insert(&mut self, file_id: FileId, path: VfsPath) {
|
|
|
|
|
self.files.insert(path.clone(), file_id);
|
|
|
|
|
self.paths.insert(file_id, path);
|
|
|
|
|
}
|
|
|
|
|
pub fn iter(&self) -> impl Iterator<Item = FileId> + '_ {
|
|
|
|
|
self.paths.keys().copied()
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
impl fmt::Debug for FileSet {
|
|
|
|
|
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
|
|
|
|
|
f.debug_struct("FileSet").field("n_files", &self.files.len()).finish()
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[derive(Debug)]
|
|
|
|
|
pub struct FileSetConfig {
|
|
|
|
|
n_file_sets: usize,
|
2020-07-07 20:53:12 +00:00
|
|
|
|
map: fst::Map<Vec<u8>>,
|
2020-06-15 11:29:07 +00:00
|
|
|
|
}
|
|
|
|
|
|
2020-06-19 13:07:32 +00:00
|
|
|
|
impl Default for FileSetConfig {
|
|
|
|
|
fn default() -> Self {
|
|
|
|
|
FileSetConfig::builder().build()
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2020-06-15 11:29:07 +00:00
|
|
|
|
impl FileSetConfig {
|
|
|
|
|
pub fn builder() -> FileSetConfigBuilder {
|
|
|
|
|
FileSetConfigBuilder::default()
|
|
|
|
|
}
|
|
|
|
|
pub fn partition(&self, vfs: &Vfs) -> Vec<FileSet> {
|
2020-07-07 20:53:12 +00:00
|
|
|
|
let mut scratch_space = Vec::new();
|
2020-06-15 11:29:07 +00:00
|
|
|
|
let mut res = vec![FileSet::default(); self.len()];
|
|
|
|
|
for (file_id, path) in vfs.iter() {
|
2020-07-07 20:53:12 +00:00
|
|
|
|
let root = self.classify(&path, &mut scratch_space);
|
2020-07-14 13:57:10 +00:00
|
|
|
|
res[root].insert(file_id, path.clone())
|
2020-06-15 11:29:07 +00:00
|
|
|
|
}
|
|
|
|
|
res
|
|
|
|
|
}
|
|
|
|
|
fn len(&self) -> usize {
|
|
|
|
|
self.n_file_sets
|
|
|
|
|
}
|
2020-07-07 20:53:12 +00:00
|
|
|
|
fn classify(&self, path: &VfsPath, scratch_space: &mut Vec<u8>) -> usize {
|
|
|
|
|
scratch_space.clear();
|
|
|
|
|
path.encode(scratch_space);
|
|
|
|
|
let automaton = PrefixOf::new(scratch_space.as_slice());
|
|
|
|
|
let mut longest_prefix = self.len() - 1;
|
|
|
|
|
let mut stream = self.map.search(automaton).into_stream();
|
|
|
|
|
while let Some((_, v)) = stream.next() {
|
|
|
|
|
longest_prefix = v as usize;
|
|
|
|
|
}
|
|
|
|
|
longest_prefix
|
2020-06-15 11:29:07 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
pub struct FileSetConfigBuilder {
|
2020-06-11 09:04:09 +00:00
|
|
|
|
roots: Vec<Vec<VfsPath>>,
|
2020-06-15 11:29:07 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
impl Default for FileSetConfigBuilder {
|
|
|
|
|
fn default() -> Self {
|
|
|
|
|
FileSetConfigBuilder { roots: Vec::new() }
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
impl FileSetConfigBuilder {
|
2020-06-19 13:07:32 +00:00
|
|
|
|
pub fn len(&self) -> usize {
|
|
|
|
|
self.roots.len()
|
|
|
|
|
}
|
2020-06-11 09:04:09 +00:00
|
|
|
|
pub fn add_file_set(&mut self, roots: Vec<VfsPath>) {
|
2020-06-15 11:29:07 +00:00
|
|
|
|
self.roots.push(roots)
|
|
|
|
|
}
|
|
|
|
|
pub fn build(self) -> FileSetConfig {
|
|
|
|
|
let n_file_sets = self.roots.len() + 1;
|
2020-07-07 20:53:12 +00:00
|
|
|
|
let map = {
|
|
|
|
|
let mut entries = Vec::new();
|
|
|
|
|
for (i, paths) in self.roots.into_iter().enumerate() {
|
|
|
|
|
for p in paths {
|
|
|
|
|
let mut buf = Vec::new();
|
|
|
|
|
p.encode(&mut buf);
|
|
|
|
|
entries.push((buf, i as u64));
|
|
|
|
|
}
|
2020-07-07 15:38:02 +00:00
|
|
|
|
}
|
2020-07-07 20:53:12 +00:00
|
|
|
|
entries.sort();
|
|
|
|
|
entries.dedup_by(|(a, _), (b, _)| a == b);
|
|
|
|
|
fst::Map::from_iter(entries).unwrap()
|
|
|
|
|
};
|
|
|
|
|
FileSetConfig { n_file_sets, map }
|
2020-07-07 15:38:02 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2020-07-07 20:53:12 +00:00
|
|
|
|
struct PrefixOf<'a> {
|
|
|
|
|
prefix_of: &'a [u8],
|
2020-07-07 15:38:02 +00:00
|
|
|
|
}
|
|
|
|
|
|
2020-07-07 20:53:12 +00:00
|
|
|
|
impl<'a> PrefixOf<'a> {
|
|
|
|
|
fn new(prefix_of: &'a [u8]) -> Self {
|
|
|
|
|
Self { prefix_of }
|
2020-07-07 15:38:02 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2020-07-07 20:53:12 +00:00
|
|
|
|
impl fst::Automaton for PrefixOf<'_> {
|
|
|
|
|
type State = usize;
|
|
|
|
|
fn start(&self) -> usize {
|
|
|
|
|
0
|
|
|
|
|
}
|
|
|
|
|
fn is_match(&self, &state: &usize) -> bool {
|
|
|
|
|
state != !0
|
|
|
|
|
}
|
|
|
|
|
fn can_match(&self, &state: &usize) -> bool {
|
|
|
|
|
state != !0
|
|
|
|
|
}
|
|
|
|
|
fn accept(&self, &state: &usize, byte: u8) -> usize {
|
|
|
|
|
if self.prefix_of.get(state) == Some(&byte) {
|
|
|
|
|
state + 1
|
|
|
|
|
} else {
|
|
|
|
|
!0
|
2020-07-07 15:38:02 +00:00
|
|
|
|
}
|
2020-06-15 11:29:07 +00:00
|
|
|
|
}
|
2020-07-07 15:38:02 +00:00
|
|
|
|
}
|
|
|
|
|
|
2020-07-26 09:05:28 +00:00
|
|
|
|
#[cfg(test)]
|
|
|
|
|
mod tests {
|
|
|
|
|
use super::*;
|
|
|
|
|
|
|
|
|
|
#[test]
|
|
|
|
|
fn path_prefix() {
|
|
|
|
|
let mut file_set = FileSetConfig::builder();
|
|
|
|
|
file_set.add_file_set(vec![VfsPath::new_virtual_path("/foo".into())]);
|
|
|
|
|
file_set.add_file_set(vec![VfsPath::new_virtual_path("/foo/bar/baz".into())]);
|
|
|
|
|
let file_set = file_set.build();
|
|
|
|
|
|
|
|
|
|
let mut vfs = Vfs::default();
|
|
|
|
|
vfs.set_file_contents(
|
|
|
|
|
VfsPath::new_virtual_path("/foo/src/lib.rs".into()),
|
|
|
|
|
Some(Vec::new()),
|
|
|
|
|
);
|
|
|
|
|
vfs.set_file_contents(
|
|
|
|
|
VfsPath::new_virtual_path("/foo/src/bar/baz/lib.rs".into()),
|
|
|
|
|
Some(Vec::new()),
|
|
|
|
|
);
|
|
|
|
|
vfs.set_file_contents(
|
|
|
|
|
VfsPath::new_virtual_path("/foo/bar/baz/lib.rs".into()),
|
|
|
|
|
Some(Vec::new()),
|
|
|
|
|
);
|
|
|
|
|
vfs.set_file_contents(VfsPath::new_virtual_path("/quux/lib.rs".into()), Some(Vec::new()));
|
|
|
|
|
|
|
|
|
|
let partition = file_set.partition(&vfs).into_iter().map(|it| it.len()).collect::<Vec<_>>();
|
|
|
|
|
assert_eq!(partition, vec![2, 1, 1]);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[test]
|
|
|
|
|
fn name_prefix() {
|
|
|
|
|
let mut file_set = FileSetConfig::builder();
|
|
|
|
|
file_set.add_file_set(vec![VfsPath::new_virtual_path("/foo".into())]);
|
|
|
|
|
file_set.add_file_set(vec![VfsPath::new_virtual_path("/foo-things".into())]);
|
|
|
|
|
let file_set = file_set.build();
|
|
|
|
|
|
|
|
|
|
let mut vfs = Vfs::default();
|
|
|
|
|
vfs.set_file_contents(
|
|
|
|
|
VfsPath::new_virtual_path("/foo/src/lib.rs".into()),
|
|
|
|
|
Some(Vec::new()),
|
|
|
|
|
);
|
|
|
|
|
vfs.set_file_contents(
|
|
|
|
|
VfsPath::new_virtual_path("/foo-things/src/lib.rs".into()),
|
|
|
|
|
Some(Vec::new()),
|
|
|
|
|
);
|
|
|
|
|
|
|
|
|
|
let partition = file_set.partition(&vfs).into_iter().map(|it| it.len()).collect::<Vec<_>>();
|
|
|
|
|
assert_eq!(partition, vec![1, 1, 0]);
|
|
|
|
|
}
|
2020-06-15 11:29:07 +00:00
|
|
|
|
}
|