Add more documentation for term search

This commit is contained in:
Tavo Annus 2023-12-12 16:34:31 +02:00
parent bb3c7cff60
commit 35eb0dbbc0
3 changed files with 120 additions and 13 deletions

View File

@ -12,25 +12,45 @@
mod tactics; mod tactics;
/// # Maximum amount of variations to take per type
///
/// This is to speed up term search as there may be huge amount of variations of arguments for
/// function, even when the return type is always the same. The idea is to take first n and call it
/// a day.
const MAX_VARIATIONS: usize = 10; const MAX_VARIATIONS: usize = 10;
/// Key for lookup table to query new types reached.
#[derive(Debug, Hash, PartialEq, Eq)] #[derive(Debug, Hash, PartialEq, Eq)]
enum NewTypesKey { enum NewTypesKey {
ImplMethod, ImplMethod,
StructProjection, StructProjection,
} }
/// Lookup table for term search /// # Lookup table for term search
///
/// Lookup table keeps all the state during term search.
/// This means it knows what types and how are reachable.
///
/// The secondary functionality for lookup table is to keep track of new types reached since last
/// iteration as well as keeping track of which `ScopeDef` items have been used.
/// Both of them are to speed up the term search by leaving out types / ScopeDefs that likely do
/// not produce any new results.
#[derive(Default, Debug)] #[derive(Default, Debug)]
struct LookupTable { struct LookupTable {
/// All the `TypeTree`s in "value" produce the type of "key"
data: FxHashMap<Type, FxHashSet<TypeTree>>, data: FxHashMap<Type, FxHashSet<TypeTree>>,
/// New types reached since last query by the `NewTypesKey`
new_types: FxHashMap<NewTypesKey, Vec<Type>>, new_types: FxHashMap<NewTypesKey, Vec<Type>>,
/// ScopeDefs that are not interesting any more
exhausted_scopedefs: FxHashSet<ScopeDef>, exhausted_scopedefs: FxHashSet<ScopeDef>,
/// ScopeDefs that were used in current round
round_scopedef_hits: FxHashSet<ScopeDef>, round_scopedef_hits: FxHashSet<ScopeDef>,
scopedef_hits: FxHashMap<ScopeDef, u32>, /// Amount of rounds since scopedef was first used.
rounds_since_sopedef_hit: FxHashMap<ScopeDef, u32>,
} }
impl LookupTable { impl LookupTable {
/// Initialize lookup table
fn new() -> Self { fn new() -> Self {
let mut res: Self = Default::default(); let mut res: Self = Default::default();
res.new_types.insert(NewTypesKey::ImplMethod, Vec::new()); res.new_types.insert(NewTypesKey::ImplMethod, Vec::new());
@ -38,6 +58,7 @@ fn new() -> Self {
res res
} }
/// Find all `TypeTree`s that unify with the `ty`
fn find(&self, db: &dyn HirDatabase, ty: &Type) -> Option<Vec<TypeTree>> { fn find(&self, db: &dyn HirDatabase, ty: &Type) -> Option<Vec<TypeTree>> {
self.data self.data
.iter() .iter()
@ -45,6 +66,10 @@ fn find(&self, db: &dyn HirDatabase, ty: &Type) -> Option<Vec<TypeTree>> {
.map(|(_, tts)| tts.iter().cloned().collect()) .map(|(_, tts)| tts.iter().cloned().collect())
} }
/// Same as find but automatically creates shared reference of types in the lookup
///
/// For example if we have type `i32` in data and we query for `&i32` it map all the type
/// trees we have for `i32` with `TypeTree::Reference` and returns them.
fn find_autoref(&self, db: &dyn HirDatabase, ty: &Type) -> Option<Vec<TypeTree>> { fn find_autoref(&self, db: &dyn HirDatabase, ty: &Type) -> Option<Vec<TypeTree>> {
self.data self.data
.iter() .iter()
@ -62,6 +87,11 @@ fn find_autoref(&self, db: &dyn HirDatabase, ty: &Type) -> Option<Vec<TypeTree>>
}) })
} }
/// Insert new type trees for type
///
/// Note that the types have to be the same, unification is not enough as unification is not
/// transitive. For example Vec<i32> and FxHashSet<i32> both unify with Iterator<Item = i32>,
/// but they clearly do not unify themselves.
fn insert(&mut self, ty: Type, trees: impl Iterator<Item = TypeTree>) { fn insert(&mut self, ty: Type, trees: impl Iterator<Item = TypeTree>) {
match self.data.get_mut(&ty) { match self.data.get_mut(&ty) {
Some(it) => it.extend(trees.take(MAX_VARIATIONS)), Some(it) => it.extend(trees.take(MAX_VARIATIONS)),
@ -74,10 +104,14 @@ fn insert(&mut self, ty: Type, trees: impl Iterator<Item = TypeTree>) {
} }
} }
/// Iterate all the reachable types
fn iter_types(&self) -> impl Iterator<Item = Type> + '_ { fn iter_types(&self) -> impl Iterator<Item = Type> + '_ {
self.data.keys().cloned() self.data.keys().cloned()
} }
/// Query new types reached since last query by key
///
/// Create new key if you wish to query it to avoid conflicting with existing queries.
fn new_types(&mut self, key: NewTypesKey) -> Vec<Type> { fn new_types(&mut self, key: NewTypesKey) -> Vec<Type> {
match self.new_types.get_mut(&key) { match self.new_types.get_mut(&key) {
Some(it) => std::mem::take(it), Some(it) => std::mem::take(it),
@ -85,17 +119,24 @@ fn new_types(&mut self, key: NewTypesKey) -> Vec<Type> {
} }
} }
/// Mark `ScopeDef` as exhausted meaning it is not interesting for us any more
fn mark_exhausted(&mut self, def: ScopeDef) { fn mark_exhausted(&mut self, def: ScopeDef) {
self.exhausted_scopedefs.insert(def); self.exhausted_scopedefs.insert(def);
} }
/// Mark `ScopeDef` as used meaning we managed to produce something useful from it
fn mark_fulfilled(&mut self, def: ScopeDef) { fn mark_fulfilled(&mut self, def: ScopeDef) {
self.round_scopedef_hits.insert(def); self.round_scopedef_hits.insert(def);
} }
/// Start new round (meant to be called at the beginning of iteration in `term_search`)
///
/// This functions marks some `ScopeDef`s as exhausted if there have been
/// `MAX_ROUNDS_AFTER_HIT` rounds after first using a `ScopeDef`.
fn new_round(&mut self) { fn new_round(&mut self) {
for def in &self.round_scopedef_hits { for def in &self.round_scopedef_hits {
let hits = self.scopedef_hits.entry(*def).and_modify(|n| *n += 1).or_insert(0); let hits =
self.rounds_since_sopedef_hit.entry(*def).and_modify(|n| *n += 1).or_insert(0);
const MAX_ROUNDS_AFTER_HIT: u32 = 2; const MAX_ROUNDS_AFTER_HIT: u32 = 2;
if *hits > MAX_ROUNDS_AFTER_HIT { if *hits > MAX_ROUNDS_AFTER_HIT {
self.exhausted_scopedefs.insert(*def); self.exhausted_scopedefs.insert(*def);
@ -104,6 +145,7 @@ fn new_round(&mut self) {
self.round_scopedef_hits.clear(); self.round_scopedef_hits.clear();
} }
/// Get exhausted `ScopeDef`s
fn exhausted_scopedefs(&self) -> &FxHashSet<ScopeDef> { fn exhausted_scopedefs(&self) -> &FxHashSet<ScopeDef> {
&self.exhausted_scopedefs &self.exhausted_scopedefs
} }
@ -117,6 +159,22 @@ fn exhausted_scopedefs(&self) -> &FxHashSet<ScopeDef> {
/// * `sema` - Semantics for the program /// * `sema` - Semantics for the program
/// * `scope` - Semantic scope, captures context for the term search /// * `scope` - Semantic scope, captures context for the term search
/// * `goal` - Target / expected output type /// * `goal` - Target / expected output type
///
/// Internally this function uses Breadth First Search to find path to `goal` type.
/// The general idea is following:
/// 1. Populate lookup (frontier for BFS) from values (local variables, statics, constants, etc)
/// as well as from well knows values (such as `true/false` and `()`)
/// 2. Iteratively expand the frontier (or contents of the lookup) by trying different type
/// transformation tactics. For example functions take as from set of types (arguments) to some
/// type (return type). Other transformations include methods on type, type constructors and
/// projections to struct fields (field access).
/// 3. Once we manage to find path to type we are interested in we continue for single round to see
/// if we can find more paths that take us to the `goal` type.
/// 4. Return all the paths (type trees) that take us to the `goal` type.
///
/// Note that there are usually more ways we can get to the `goal` type but some are discarded to
/// reduce the memory consumption. It is also unlikely anyone is willing ti browse through
/// thousands of possible responses so we currently take first 10 from every tactic.
pub fn term_search<DB: HirDatabase>( pub fn term_search<DB: HirDatabase>(
sema: &Semantics<'_, DB>, sema: &Semantics<'_, DB>,
scope: &SemanticsScope<'_>, scope: &SemanticsScope<'_>,
@ -135,6 +193,7 @@ pub fn term_search<DB: HirDatabase>(
// Try trivial tactic first, also populates lookup table // Try trivial tactic first, also populates lookup table
let mut solutions: Vec<TypeTree> = let mut solutions: Vec<TypeTree> =
tactics::trivial(sema.db, &defs, &mut lookup, goal).collect(); tactics::trivial(sema.db, &defs, &mut lookup, goal).collect();
// Use well known types tactic before iterations as it does not depend on other tactics
solutions.extend(tactics::famous_types(sema.db, &module, &defs, &mut lookup, goal)); solutions.extend(tactics::famous_types(sema.db, &module, &defs, &mut lookup, goal));
let mut solution_found = !solutions.is_empty(); let mut solution_found = !solutions.is_empty();
@ -147,12 +206,14 @@ pub fn term_search<DB: HirDatabase>(
solutions.extend(tactics::impl_method(sema.db, &module, &defs, &mut lookup, goal)); solutions.extend(tactics::impl_method(sema.db, &module, &defs, &mut lookup, goal));
solutions.extend(tactics::struct_projection(sema.db, &module, &defs, &mut lookup, goal)); solutions.extend(tactics::struct_projection(sema.db, &module, &defs, &mut lookup, goal));
// Break after 1 round after successful solution
if solution_found { if solution_found {
break; break;
} }
solution_found = !solutions.is_empty(); solution_found = !solutions.is_empty();
// Discard not interesting `ScopeDef`s for speedup
for def in lookup.exhausted_scopedefs() { for def in lookup.exhausted_scopedefs() {
defs.remove(def); defs.remove(def);
} }

View File

@ -1,4 +1,12 @@
//! Tactics for term search //! Tactics for term search
//!
//! All the tactics take following arguments
//! * `db` - HIR database
//! * `module` - Module where the term search target location
//! * `defs` - Set of items in scope at term search target location
//! * `lookup` - Lookup table for types
//! * `goal` - Term search target type
//! And they return iterator that yields type trees that unify with the `goal` type.
use hir_def::generics::TypeOrConstParamData; use hir_def::generics::TypeOrConstParamData;
use hir_ty::db::HirDatabase; use hir_ty::db::HirDatabase;
@ -16,10 +24,21 @@
use super::{LookupTable, NewTypesKey, MAX_VARIATIONS}; use super::{LookupTable, NewTypesKey, MAX_VARIATIONS};
/// Trivial tactic /// # Trivial tactic
/// ///
/// Attempts to fulfill the goal by trying items in scope /// Attempts to fulfill the goal by trying items in scope
/// Also works as a starting point to move all items in scope to lookup table /// Also works as a starting point to move all items in scope to lookup table.
///
/// # Arguments
/// * `db` - HIR database
/// * `defs` - Set of items in scope at term search target location
/// * `lookup` - Lookup table for types
/// * `goal` - Term search target type
///
/// Returns iterator that yields elements that unify with `goal`.
///
/// _Note that there is no use of calling this tactic in every iteration as the output does not
/// depend on the current state of `lookup`_
pub(super) fn trivial<'a>( pub(super) fn trivial<'a>(
db: &'a dyn HirDatabase, db: &'a dyn HirDatabase,
defs: &'a FxHashSet<ScopeDef>, defs: &'a FxHashSet<ScopeDef>,
@ -67,10 +86,13 @@ pub(super) fn trivial<'a>(
}) })
} }
/// Type constructor tactic /// # Type constructor tactic
/// ///
/// Attempts different type constructors for enums and structs in scope /// Attempts different type constructors for enums and structs in scope
/// ///
/// Updates lookup by new types reached and returns iterator that yields
/// elements that unify with `goal`.
///
/// # Arguments /// # Arguments
/// * `db` - HIR database /// * `db` - HIR database
/// * `module` - Module where the term search target location /// * `module` - Module where the term search target location
@ -255,9 +277,13 @@ fn variant_helper(
.flatten() .flatten()
} }
/// Free function tactic /// # Free function tactic
/// ///
/// Attempts to call different functions in scope with parameters from lookup table /// Attempts to call different functions in scope with parameters from lookup table.
/// Functions that include generics are not used for performance reasons.
///
/// Updates lookup by new types reached and returns iterator that yields
/// elements that unify with `goal`.
/// ///
/// # Arguments /// # Arguments
/// * `db` - HIR database /// * `db` - HIR database
@ -356,10 +382,15 @@ pub(super) fn free_function<'a>(
.flatten() .flatten()
} }
/// Impl method tactic /// # Impl method tactic
/// ///
/// Attempts to to call methods on types from lookup table. /// Attempts to to call methods on types from lookup table.
/// This includes both functions from direct impl blocks as well as functions from traits. /// This includes both functions from direct impl blocks as well as functions from traits.
/// Methods defined in impl blocks that are generic and methods that are themselves have
/// generics are ignored for performance reasons.
///
/// Updates lookup by new types reached and returns iterator that yields
/// elements that unify with `goal`.
/// ///
/// # Arguments /// # Arguments
/// * `db` - HIR database /// * `db` - HIR database
@ -484,9 +515,12 @@ pub(super) fn impl_method<'a>(
.flatten() .flatten()
} }
/// Struct projection tactic /// # Struct projection tactic
/// ///
/// Attempts different struct fields /// Attempts different struct fields (`foo.bar.baz`)
///
/// Updates lookup by new types reached and returns iterator that yields
/// elements that unify with `goal`.
/// ///
/// # Arguments /// # Arguments
/// * `db` - HIR database /// * `db` - HIR database
@ -522,9 +556,14 @@ pub(super) fn struct_projection<'a>(
.flatten() .flatten()
} }
/// Famous types tactic /// # Famous types tactic
/// ///
/// Attempts different values of well known types such as `true` or `false` /// Attempts different values of well known types such as `true` or `false`.
///
/// Updates lookup by new types reached and returns iterator that yields
/// elements that unify with `goal`.
///
/// _Note that there is no point of calling it iteratively as the output is always the same_
/// ///
/// # Arguments /// # Arguments
/// * `db` - HIR database /// * `db` - HIR database

View File

@ -9,6 +9,7 @@
Struct, StructKind, Trait, Type, Variant, Struct, StructKind, Trait, Type, Variant,
}; };
/// Helper function to prefix items with modules when required
fn mod_item_path(db: &dyn HirDatabase, sema_scope: &SemanticsScope<'_>, def: &ModuleDef) -> String { fn mod_item_path(db: &dyn HirDatabase, sema_scope: &SemanticsScope<'_>, def: &ModuleDef) -> String {
// Account for locals shadowing items from module // Account for locals shadowing items from module
let name_hit_count = def.name(db).map(|def_name| { let name_hit_count = def.name(db).map(|def_name| {
@ -76,6 +77,11 @@ pub enum TypeTree {
} }
impl TypeTree { impl TypeTree {
/// Generate source code for type tree.
///
/// Note that trait imports are not added to generated code.
/// To make sure that the code is valid, callee has to also ensure that all the traits listed
/// by `traits_used` method are also imported.
pub fn gen_source_code(&self, sema_scope: &SemanticsScope<'_>) -> String { pub fn gen_source_code(&self, sema_scope: &SemanticsScope<'_>) -> String {
let db = sema_scope.db; let db = sema_scope.db;
match self { match self {
@ -222,6 +228,7 @@ pub fn ty(&self, db: &dyn HirDatabase) -> Type {
} }
} }
/// List the traits used in type tree
pub fn traits_used(&self, db: &dyn HirDatabase) -> Vec<Trait> { pub fn traits_used(&self, db: &dyn HirDatabase) -> Vec<Trait> {
let mut res = Vec::new(); let mut res = Vec::new();