//! This module specifies the input to rust-analyzer. In some sense, this is //! **the** most important module, because all other fancy stuff is strictly //! derived from this input. //! //! Note that neither this module, nor any other part of the analyzer's core do //! actual IO. See `vfs` and `project_model` in the `ra_lsp_server` crate for how //! actual IO is done and lowered to input. use std::{fmt, str::FromStr}; use ra_cfg::CfgOptions; use ra_syntax::SmolStr; use rustc_hash::FxHashMap; use rustc_hash::FxHashSet; use crate::{RelativePath, RelativePathBuf}; /// `FileId` is an integer which uniquely identifies a file. File paths are /// messy and system-dependent, so most of the code should work directly with /// `FileId`, without inspecting the path. The mapping between `FileId` and path /// and `SourceRoot` is constant. A file rename is represented as a pair of /// deletion/creation. #[derive(Debug, Clone, Copy, PartialEq, Eq, PartialOrd, Ord, Hash)] pub struct FileId(pub u32); /// Files are grouped into source roots. A source root is a directory on the /// file systems which is watched for changes. Typically it corresponds to a /// Rust crate. Source roots *might* be nested: in this case, a file belongs to /// the nearest enclosing source root. Paths to files are always relative to a /// source root, and the analyzer does not know the root path of the source root at /// all. So, a file from one source root can't refer to a file in another source /// root by path. #[derive(Debug, Clone, Copy, PartialEq, Eq, Hash, PartialOrd, Ord)] pub struct SourceRootId(pub u32); #[derive(Clone, Debug, PartialEq, Eq)] pub struct SourceRoot { /// Sysroot or crates.io library. /// /// Libraries are considered mostly immutable, this assumption is used to /// optimize salsa's query structure pub is_library: bool, files: FxHashMap, } impl SourceRoot { pub fn new_local() -> SourceRoot { SourceRoot { is_library: false, files: Default::default() } } pub fn new_library() -> SourceRoot { SourceRoot { is_library: true, files: Default::default() } } pub fn insert_file(&mut self, path: RelativePathBuf, file_id: FileId) { self.files.insert(path, file_id); } pub fn remove_file(&mut self, path: &RelativePath) { self.files.remove(path); } pub fn walk(&self) -> impl Iterator + '_ { self.files.values().copied() } pub fn file_by_relative_path(&self, path: &RelativePath) -> Option { self.files.get(path).copied() } } /// `CrateGraph` is a bit of information which turns a set of text files into a /// number of Rust crates. Each crate is defined by the `FileId` of its root module, /// the set of cfg flags (not yet implemented) and the set of dependencies. Note /// that, due to cfg's, there might be several crates for a single `FileId`! As /// in the rust-lang proper, a crate does not have a name. Instead, names are /// specified on dependency edges. That is, a crate might be known under /// different names in different dependent crates. /// /// Note that `CrateGraph` is build-system agnostic: it's a concept of the Rust /// language proper, not a concept of the build system. In practice, we get /// `CrateGraph` by lowering `cargo metadata` output. #[derive(Debug, Clone, Default, PartialEq, Eq)] pub struct CrateGraph { arena: FxHashMap, } #[derive(Debug, Clone, Copy, PartialEq, Eq, PartialOrd, Ord, Hash)] pub struct CrateId(pub u32); pub struct CrateName(SmolStr); impl> From for CrateName { fn from(name: T) -> Self { // For root projects with dashes in their name, // cargo metadata does not do any normalization // so we do it ourselves Self(SmolStr::new(name.as_ref().replace('-', "_"))) } } #[derive(Debug, Clone, PartialEq, Eq)] struct CrateData { file_id: FileId, edition: Edition, cfg_options: CfgOptions, env: Env, dependencies: Vec, } #[derive(Debug, Clone, Copy, PartialEq, Eq, Hash)] pub enum Edition { Edition2018, Edition2015, } #[derive(Default, Debug, Clone, PartialEq, Eq)] pub struct Env { entries: FxHashMap, } #[derive(Debug, Clone, PartialEq, Eq)] pub struct Dependency { pub crate_id: CrateId, pub name: SmolStr, } impl CrateGraph { pub fn add_crate_root( &mut self, file_id: FileId, edition: Edition, cfg_options: CfgOptions, env: Env, ) -> CrateId { let data = CrateData::new(file_id, edition, cfg_options, env); let crate_id = CrateId(self.arena.len() as u32); let prev = self.arena.insert(crate_id, data); assert!(prev.is_none()); crate_id } pub fn cfg_options(&self, crate_id: CrateId) -> &CfgOptions { &self.arena[&crate_id].cfg_options } pub fn add_dep( &mut self, from: CrateId, name: CrateName, to: CrateId, ) -> Result<(), CyclicDependenciesError> { if self.dfs_find(from, to, &mut FxHashSet::default()) { return Err(CyclicDependenciesError); } self.arena.get_mut(&from).unwrap().add_dep(name.0, to); Ok(()) } pub fn is_empty(&self) -> bool { self.arena.is_empty() } pub fn iter<'a>(&'a self) -> impl Iterator + 'a { self.arena.keys().copied() } pub fn crate_root(&self, crate_id: CrateId) -> FileId { self.arena[&crate_id].file_id } pub fn edition(&self, crate_id: CrateId) -> Edition { self.arena[&crate_id].edition } // FIXME: this only finds one crate with the given root; we could have multiple pub fn crate_id_for_crate_root(&self, file_id: FileId) -> Option { let (&crate_id, _) = self.arena.iter().find(|(_crate_id, data)| data.file_id == file_id)?; Some(crate_id) } pub fn dependencies<'a>( &'a self, crate_id: CrateId, ) -> impl Iterator + 'a { self.arena[&crate_id].dependencies.iter() } /// Extends this crate graph by adding a complete disjoint second crate /// graph. /// /// The ids of the crates in the `other` graph are shifted by the return /// amount. pub fn extend(&mut self, other: CrateGraph) -> u32 { let start = self.arena.len() as u32; self.arena.extend(other.arena.into_iter().map(|(id, mut data)| { let new_id = id.shift(start); for dep in &mut data.dependencies { dep.crate_id = dep.crate_id.shift(start); } (new_id, data) })); start } fn dfs_find(&self, target: CrateId, from: CrateId, visited: &mut FxHashSet) -> bool { if !visited.insert(from) { return false; } for dep in self.dependencies(from) { let crate_id = dep.crate_id(); if crate_id == target { return true; } if self.dfs_find(target, crate_id, visited) { return true; } } false } } impl CrateId { pub fn shift(self, amount: u32) -> CrateId { CrateId(self.0 + amount) } } impl CrateData { fn new(file_id: FileId, edition: Edition, cfg_options: CfgOptions, env: Env) -> CrateData { CrateData { file_id, edition, dependencies: Vec::new(), cfg_options, env } } fn add_dep(&mut self, name: SmolStr, crate_id: CrateId) { self.dependencies.push(Dependency { name, crate_id }) } } impl FromStr for Edition { type Err = ParseEditionError; fn from_str(s: &str) -> Result { let res = match s { "2015" => Edition::Edition2015, "2018" => Edition::Edition2018, _ => Err(ParseEditionError { invalid_input: s.to_string() })?, }; Ok(res) } } impl fmt::Display for Edition { fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { f.write_str(match self { Edition::Edition2015 => "2015", Edition::Edition2018 => "2018", }) } } impl Dependency { pub fn crate_id(&self) -> CrateId { self.crate_id } } #[derive(Debug)] pub struct ParseEditionError { invalid_input: String, } impl fmt::Display for ParseEditionError { fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { write!(f, "invalid edition: {:?}", self.invalid_input) } } impl std::error::Error for ParseEditionError {} #[derive(Debug)] pub struct CyclicDependenciesError; #[cfg(test)] mod tests { use super::{CfgOptions, CrateGraph, Dependency, Edition::Edition2018, Env, FileId}; #[test] fn it_should_panic_because_of_cycle_dependencies() { let mut graph = CrateGraph::default(); let crate1 = graph.add_crate_root(FileId(1u32), Edition2018, CfgOptions::default(), Env::default()); let crate2 = graph.add_crate_root(FileId(2u32), Edition2018, CfgOptions::default(), Env::default()); let crate3 = graph.add_crate_root(FileId(3u32), Edition2018, CfgOptions::default(), Env::default()); assert!(graph.add_dep(crate1, "crate2".into(), crate2).is_ok()); assert!(graph.add_dep(crate2, "crate3".into(), crate3).is_ok()); assert!(graph.add_dep(crate3, "crate1".into(), crate1).is_err()); } #[test] fn it_works() { let mut graph = CrateGraph::default(); let crate1 = graph.add_crate_root(FileId(1u32), Edition2018, CfgOptions::default(), Env::default()); let crate2 = graph.add_crate_root(FileId(2u32), Edition2018, CfgOptions::default(), Env::default()); let crate3 = graph.add_crate_root(FileId(3u32), Edition2018, CfgOptions::default(), Env::default()); assert!(graph.add_dep(crate1, "crate2".into(), crate2).is_ok()); assert!(graph.add_dep(crate2, "crate3".into(), crate3).is_ok()); } #[test] fn dashes_are_normalized() { let mut graph = CrateGraph::default(); let crate1 = graph.add_crate_root(FileId(1u32), Edition2018, CfgOptions::default(), Env::default()); let crate2 = graph.add_crate_root(FileId(2u32), Edition2018, CfgOptions::default(), Env::default()); assert!(graph.add_dep(crate1, "crate-name-with-dashes".into(), crate2).is_ok()); assert_eq!( graph.dependencies(crate1).collect::>(), vec![&Dependency { crate_id: crate2, name: "crate_name_with_dashes".into() }] ); } }