Skip to main content

rustdoc/html/render/
search_index.rs

1pub(crate) mod encode;
2mod serde;
3
4use std::collections::BTreeSet;
5use std::collections::hash_map::Entry;
6use std::path::Path;
7use std::string::FromUtf8Error;
8use std::{io, iter};
9
10use ::serde::de::{self, Deserializer, Error as _};
11use ::serde::ser::{SerializeSeq, Serializer};
12use ::serde::{Deserialize, Serialize};
13use rustc_ast::join_path_syms;
14use rustc_data_structures::fx::{FxHashMap, FxHashSet, FxIndexMap};
15use rustc_data_structures::thin_vec::ThinVec;
16use rustc_hir::def_id::{CrateNum, DefIndex, LOCAL_CRATE};
17use rustc_hir::find_attr;
18use rustc_middle::ty::TyCtxt;
19use rustc_span::def_id::DefId;
20use rustc_span::sym;
21use rustc_span::symbol::{Symbol, kw};
22use stringdex::internals as stringdex_internals;
23use tracing::instrument;
24
25use crate::clean::types::{Function, Generics, ItemId, Type, WherePredicate};
26use crate::clean::{self, ExternalLocation, utils};
27use crate::config::ShouldMerge;
28use crate::error::Error;
29use crate::formats::cache::{Cache, OrphanImplItem};
30use crate::formats::item_type::ItemType;
31use crate::html::markdown::short_markdown_summary;
32use crate::html::render::{
33    self, IndexItem, IndexItemFunctionType, IndexItemInfo, RenderType, RenderTypeId,
34};
35
36#[derive(Clone, Debug, Default, Deserialize, Serialize)]
37pub(crate) struct SerializedSearchIndex {
38    // data from disk
39    names: Vec<String>,
40    path_data: Vec<Option<PathData>>,
41    entry_data: Vec<Option<EntryData>>,
42    descs: Vec<String>,
43    function_data: Vec<Option<IndexItemFunctionType>>,
44    alias_pointers: Vec<Option<usize>>,
45    // inverted index for concrete types and generics
46    type_data: Vec<Option<TypeData>>,
47    /// inverted index of generics
48    ///
49    /// - The outermost list has one entry per alpha-normalized generic.
50    ///
51    /// - The second layer is sorted by number of types that appear in the
52    ///   type signature. The search engine iterates over these in order from
53    ///   smallest to largest. Functions with less stuff in their type
54    ///   signature are more likely to be what the user wants, because we never
55    ///   show functions that are *missing* parts of the query, so removing..
56    ///
57    /// - The final layer is the list of functions.
58    generic_inverted_index: Vec<Vec<Vec<u32>>>,
59    // generated in-memory backref cache
60    #[serde(skip)]
61    crate_paths_index: FxHashMap<(ItemType, Vec<Symbol>), usize>,
62}
63
64impl SerializedSearchIndex {
65    fn load(doc_root: &Path, resource_suffix: &str) -> Result<SerializedSearchIndex, Error> {
66        let mut names: Vec<String> = Vec::new();
67        let mut path_data: Vec<Option<PathData>> = Vec::new();
68        let mut entry_data: Vec<Option<EntryData>> = Vec::new();
69        let mut descs: Vec<String> = Vec::new();
70        let mut function_data: Vec<Option<IndexItemFunctionType>> = Vec::new();
71        let mut type_data: Vec<Option<TypeData>> = Vec::new();
72        let mut alias_pointers: Vec<Option<usize>> = Vec::new();
73
74        let mut generic_inverted_index: Vec<Vec<Vec<u32>>> = Vec::new();
75
76        match perform_read_strings(resource_suffix, doc_root, "name", &mut names) {
77            Ok(()) => {
78                perform_read_serde(resource_suffix, doc_root, "path", &mut path_data)?;
79                perform_read_serde(resource_suffix, doc_root, "entry", &mut entry_data)?;
80                perform_read_strings(resource_suffix, doc_root, "desc", &mut descs)?;
81                perform_read_serde(resource_suffix, doc_root, "function", &mut function_data)?;
82                perform_read_serde(resource_suffix, doc_root, "type", &mut type_data)?;
83                perform_read_serde(resource_suffix, doc_root, "alias", &mut alias_pointers)?;
84                perform_read_postings(
85                    resource_suffix,
86                    doc_root,
87                    "generic_inverted_index",
88                    &mut generic_inverted_index,
89                )?;
90            }
91            Err(_) => {
92                names.clear();
93            }
94        }
95        fn perform_read_strings(
96            resource_suffix: &str,
97            doc_root: &Path,
98            column_name: &str,
99            column: &mut Vec<String>,
100        ) -> Result<(), Error> {
101            let root_path = doc_root.join(format!("search.index/root{resource_suffix}.js"));
102            let column_path = doc_root.join(format!("search.index/{column_name}/"));
103
104            let mut consume = |_, cell: &[u8]| {
105                column.push(String::from_utf8(cell.to_vec())?);
106                Ok::<_, FromUtf8Error>(())
107            };
108
109            stringdex_internals::read_data_from_disk_column(
110                root_path,
111                column_name.as_bytes(),
112                column_path.clone(),
113                &mut consume,
114            )
115            .map_err(|error| Error {
116                file: column_path,
117                error: format!("failed to read column from disk: {error}"),
118            })
119        }
120        fn perform_read_serde(
121            resource_suffix: &str,
122            doc_root: &Path,
123            column_name: &str,
124            column: &mut Vec<Option<impl for<'de> Deserialize<'de> + 'static>>,
125        ) -> Result<(), Error> {
126            let root_path = doc_root.join(format!("search.index/root{resource_suffix}.js"));
127            let column_path = doc_root.join(format!("search.index/{column_name}/"));
128
129            let mut consume = |_, cell: &[u8]| {
130                if cell.is_empty() {
131                    column.push(None);
132                } else {
133                    column.push(Some(serde_json::from_slice(cell)?));
134                }
135                Ok::<_, serde_json::Error>(())
136            };
137
138            stringdex_internals::read_data_from_disk_column(
139                root_path,
140                column_name.as_bytes(),
141                column_path.clone(),
142                &mut consume,
143            )
144            .map_err(|error| Error {
145                file: column_path,
146                error: format!("failed to read column from disk: {error}"),
147            })
148        }
149        fn perform_read_postings(
150            resource_suffix: &str,
151            doc_root: &Path,
152            column_name: &str,
153            column: &mut Vec<Vec<Vec<u32>>>,
154        ) -> Result<(), Error> {
155            let root_path = doc_root.join(format!("search.index/root{resource_suffix}.js"));
156            let column_path = doc_root.join(format!("search.index/{column_name}/"));
157
158            fn consumer(
159                column: &mut Vec<Vec<Vec<u32>>>,
160            ) -> impl FnMut(u32, &[u8]) -> io::Result<()> {
161                |_, cell| {
162                    let mut postings = Vec::new();
163                    encode::read_postings_from_string(&mut postings, cell);
164                    column.push(postings);
165                    Ok(())
166                }
167            }
168
169            stringdex_internals::read_data_from_disk_column(
170                root_path,
171                column_name.as_bytes(),
172                column_path.clone(),
173                &mut consumer(column),
174            )
175            .map_err(|error| Error {
176                file: column_path,
177                error: format!("failed to read column from disk: {error}"),
178            })
179        }
180
181        assert_eq!(names.len(), path_data.len());
182        assert_eq!(path_data.len(), entry_data.len());
183        assert_eq!(entry_data.len(), descs.len());
184        assert_eq!(descs.len(), function_data.len());
185        assert_eq!(function_data.len(), type_data.len());
186        assert_eq!(type_data.len(), alias_pointers.len());
187
188        // generic_inverted_index is not the same length as other columns,
189        // because it's actually a completely different set of objects
190
191        let mut crate_paths_index: FxHashMap<(ItemType, Vec<Symbol>), usize> = FxHashMap::default();
192        for (i, (name, path_data)) in names.iter().zip(path_data.iter()).enumerate() {
193            if let Some(path_data) = path_data {
194                let full_path = if path_data.module_path.is_empty() {
195                    vec![Symbol::intern(name)]
196                } else {
197                    let mut full_path = path_data.module_path.to_vec();
198                    full_path.push(Symbol::intern(name));
199                    full_path
200                };
201                crate_paths_index.insert((path_data.ty, full_path), i);
202            }
203        }
204
205        Ok(SerializedSearchIndex {
206            names,
207            path_data,
208            entry_data,
209            descs,
210            function_data,
211            type_data,
212            alias_pointers,
213            generic_inverted_index,
214            crate_paths_index,
215        })
216    }
217    fn push(
218        &mut self,
219        name: String,
220        path_data: Option<PathData>,
221        entry_data: Option<EntryData>,
222        desc: String,
223        function_data: Option<IndexItemFunctionType>,
224        type_data: Option<TypeData>,
225        alias_pointer: Option<usize>,
226    ) -> usize {
227        let index = self.names.len();
228        assert_eq!(self.names.len(), self.path_data.len());
229        if let Some(path_data) = &path_data
230            && let name = Symbol::intern(&name)
231            && let fqp = if path_data.module_path.is_empty() {
232                vec![name]
233            } else {
234                let mut v = path_data.module_path.clone();
235                v.push(name);
236                v
237            }
238            && let Some(&other_path) = self.crate_paths_index.get(&(path_data.ty, fqp))
239            && self.path_data.get(other_path).map_or(false, Option::is_some)
240        {
241            self.path_data.push(None);
242        } else {
243            self.path_data.push(path_data);
244        }
245        self.names.push(name);
246        assert_eq!(self.entry_data.len(), self.descs.len());
247        self.entry_data.push(entry_data);
248        assert_eq!(self.descs.len(), self.function_data.len());
249        self.descs.push(desc);
250        assert_eq!(self.function_data.len(), self.type_data.len());
251        self.function_data.push(function_data);
252        assert_eq!(self.type_data.len(), self.alias_pointers.len());
253        self.type_data.push(type_data);
254        self.alias_pointers.push(alias_pointer);
255        index
256    }
257    /// Add potential search result to the database and return the row ID.
258    ///
259    /// The returned ID can be used to attach more data to the search result.
260    fn add_entry(&mut self, name: Symbol, entry_data: EntryData, desc: String) -> usize {
261        let fqp = if let Some(module_path_index) = entry_data.module_path {
262            self.path_data[module_path_index]
263                .as_ref()
264                .unwrap()
265                .module_path
266                .iter()
267                .copied()
268                .chain([Symbol::intern(&self.names[module_path_index]), name])
269                .collect()
270        } else {
271            vec![name]
272        };
273        // If a path with the same name already exists, but no entry does,
274        // we can fill in the entry without having to allocate a new row ID.
275        //
276        // Because paths and entries both share the same index, using the same
277        // ID saves space by making the tree smaller.
278        if let Some(&other_path) = self.crate_paths_index.get(&(entry_data.ty, fqp))
279            && self.entry_data[other_path].is_none()
280            && self.descs[other_path].is_empty()
281        {
282            self.entry_data[other_path] = Some(entry_data);
283            self.descs[other_path] = desc;
284            other_path
285        } else {
286            self.push(name.as_str().to_string(), None, Some(entry_data), desc, None, None, None)
287        }
288    }
289    fn push_path(&mut self, name: String, path_data: PathData) -> usize {
290        self.push(name, Some(path_data), None, String::new(), None, None, None)
291    }
292    fn push_type(&mut self, name: String, path_data: PathData, type_data: TypeData) -> usize {
293        self.push(name, Some(path_data), None, String::new(), None, Some(type_data), None)
294    }
295    fn push_alias(&mut self, name: String, alias_pointer: usize) -> usize {
296        self.push(name, None, None, String::new(), None, None, Some(alias_pointer))
297    }
298
299    fn get_id_by_module_path(&mut self, path: &[Symbol]) -> usize {
300        let ty = if path.len() == 1 { ItemType::ExternCrate } else { ItemType::Module };
301        match self.crate_paths_index.entry((ty, path.to_vec())) {
302            Entry::Occupied(index) => *index.get(),
303            Entry::Vacant(slot) => {
304                slot.insert(self.path_data.len());
305                let (name, module_path) = path.split_last().unwrap();
306                self.push_path(
307                    name.as_str().to_string(),
308                    PathData { ty, module_path: module_path.to_vec(), exact_module_path: None },
309                )
310            }
311        }
312    }
313
314    pub(crate) fn union(mut self, other: &SerializedSearchIndex) -> SerializedSearchIndex {
315        let other_entryid_offset = self.names.len();
316        let mut map_other_pathid_to_self_pathid = Vec::new();
317        let mut skips = FxHashSet::default();
318        for (other_pathid, other_path_data) in other.path_data.iter().enumerate() {
319            if let Some(other_path_data) = other_path_data {
320                let name = Symbol::intern(&other.names[other_pathid]);
321                let fqp =
322                    other_path_data.module_path.iter().copied().chain(iter::once(name)).collect();
323                let self_pathid = other_entryid_offset + other_pathid;
324                let self_pathid = match self.crate_paths_index.entry((other_path_data.ty, fqp)) {
325                    Entry::Vacant(slot) => {
326                        slot.insert(self_pathid);
327                        self_pathid
328                    }
329                    Entry::Occupied(existing_entryid) => {
330                        skips.insert(other_pathid);
331                        let self_pathid = *existing_entryid.get();
332                        let new_type_data = match (
333                            self.type_data[self_pathid].take(),
334                            other.type_data[other_pathid].as_ref(),
335                        ) {
336                            (Some(self_type_data), None) => Some(self_type_data),
337                            (None, Some(other_type_data)) => Some(TypeData {
338                                search_unbox: other_type_data.search_unbox,
339                                inverted_function_inputs_index: other_type_data
340                                    .inverted_function_inputs_index
341                                    .iter()
342                                    .cloned()
343                                    .map(|mut list: Vec<u32>| {
344                                        for fnid in &mut list {
345                                            assert!(
346                                                other.function_data
347                                                    [usize::try_from(*fnid).unwrap()]
348                                                .is_some(),
349                                            );
350                                            // this is valid because we call `self.push()` once, exactly, for every entry,
351                                            // even if we're just pushing a tombstone
352                                            *fnid += u32::try_from(other_entryid_offset).unwrap();
353                                        }
354                                        list
355                                    })
356                                    .collect(),
357                                inverted_function_output_index: other_type_data
358                                    .inverted_function_output_index
359                                    .iter()
360                                    .cloned()
361                                    .map(|mut list: Vec<u32>| {
362                                        for fnid in &mut list {
363                                            assert!(
364                                                other.function_data
365                                                    [usize::try_from(*fnid).unwrap()]
366                                                .is_some(),
367                                            );
368                                            // this is valid because we call `self.push()` once, exactly, for every entry,
369                                            // even if we're just pushing a tombstone
370                                            *fnid += u32::try_from(other_entryid_offset).unwrap();
371                                        }
372                                        list
373                                    })
374                                    .collect(),
375                            }),
376                            (Some(mut self_type_data), Some(other_type_data)) => {
377                                for (size, other_list) in other_type_data
378                                    .inverted_function_inputs_index
379                                    .iter()
380                                    .enumerate()
381                                {
382                                    while self_type_data.inverted_function_inputs_index.len()
383                                        <= size
384                                    {
385                                        self_type_data
386                                            .inverted_function_inputs_index
387                                            .push(Vec::new());
388                                    }
389                                    self_type_data.inverted_function_inputs_index[size].extend(
390                                        other_list.iter().copied().map(|fnid| {
391                                            assert!(
392                                                other.function_data[usize::try_from(fnid).unwrap()]
393                                                    .is_some(),
394                                            );
395                                            // this is valid because we call `self.push()` once, exactly, for every entry,
396                                            // even if we're just pushing a tombstone
397                                            fnid + u32::try_from(other_entryid_offset).unwrap()
398                                        }),
399                                    )
400                                }
401                                for (size, other_list) in other_type_data
402                                    .inverted_function_output_index
403                                    .iter()
404                                    .enumerate()
405                                {
406                                    while self_type_data.inverted_function_output_index.len()
407                                        <= size
408                                    {
409                                        self_type_data
410                                            .inverted_function_output_index
411                                            .push(Vec::new());
412                                    }
413                                    self_type_data.inverted_function_output_index[size].extend(
414                                        other_list.iter().copied().map(|fnid| {
415                                            assert!(
416                                                other.function_data[usize::try_from(fnid).unwrap()]
417                                                    .is_some(),
418                                            );
419                                            // this is valid because we call `self.push()` once, exactly, for every entry,
420                                            // even if we're just pushing a tombstone
421                                            fnid + u32::try_from(other_entryid_offset).unwrap()
422                                        }),
423                                    )
424                                }
425                                Some(self_type_data)
426                            }
427                            (None, None) => None,
428                        };
429                        self.type_data[self_pathid] = new_type_data;
430                        self_pathid
431                    }
432                };
433                map_other_pathid_to_self_pathid.push(self_pathid);
434            } else {
435                // if this gets used, we want it to crash
436                // this should be impossible as a valid index, since some of the
437                // memory must be used for stuff other than the list
438                map_other_pathid_to_self_pathid.push(!0);
439            }
440        }
441        for other_entryid in 0..other.names.len() {
442            if skips.contains(&other_entryid) {
443                // we push tombstone entries to keep the IDs lined up
444                self.push(String::new(), None, None, String::new(), None, None, None);
445            } else {
446                self.push(
447                    other.names[other_entryid].clone(),
448                    other.path_data[other_entryid].clone(),
449                    other.entry_data[other_entryid].as_ref().map(|other_entry_data| EntryData {
450                        parent: other_entry_data
451                            .parent
452                            .map(|parent| map_other_pathid_to_self_pathid[parent])
453                            .clone(),
454                        module_path: other_entry_data
455                            .module_path
456                            .map(|path| map_other_pathid_to_self_pathid[path])
457                            .clone(),
458                        exact_module_path: other_entry_data
459                            .exact_module_path
460                            .map(|exact_path| map_other_pathid_to_self_pathid[exact_path])
461                            .clone(),
462                        krate: map_other_pathid_to_self_pathid[other_entry_data.krate],
463                        ..other_entry_data.clone()
464                    }),
465                    other.descs[other_entryid].clone(),
466                    other.function_data[other_entryid].clone().map(|mut func| {
467                        fn map_fn_sig_item(
468                            map_other_pathid_to_self_pathid: &Vec<usize>,
469                            ty: &mut RenderType,
470                        ) {
471                            match ty.id {
472                                None => {}
473                                Some(RenderTypeId::Index(generic)) if generic < 0 => {}
474                                Some(RenderTypeId::Index(id)) => {
475                                    let id = usize::try_from(id).unwrap();
476                                    let id = map_other_pathid_to_self_pathid[id];
477                                    assert!(id != !0);
478                                    ty.id = Some(RenderTypeId::Index(isize::try_from(id).unwrap()));
479                                }
480                                _ => unreachable!(),
481                            }
482                            if let Some(generics) = &mut ty.generics {
483                                for generic in generics {
484                                    map_fn_sig_item(map_other_pathid_to_self_pathid, generic);
485                                }
486                            }
487                            if let Some(bindings) = &mut ty.bindings {
488                                for (param, constraints) in bindings {
489                                    *param = match *param {
490                                        param @ RenderTypeId::Index(generic) if generic < 0 => {
491                                            param
492                                        }
493                                        RenderTypeId::Index(id) => {
494                                            let id = usize::try_from(id).unwrap();
495                                            let id = map_other_pathid_to_self_pathid[id];
496                                            assert!(id != !0);
497                                            RenderTypeId::Index(isize::try_from(id).unwrap())
498                                        }
499                                        _ => unreachable!(),
500                                    };
501                                    for constraint in constraints {
502                                        map_fn_sig_item(
503                                            map_other_pathid_to_self_pathid,
504                                            constraint,
505                                        );
506                                    }
507                                }
508                            }
509                        }
510                        for input in &mut func.inputs {
511                            map_fn_sig_item(&map_other_pathid_to_self_pathid, input);
512                        }
513                        for output in &mut func.output {
514                            map_fn_sig_item(&map_other_pathid_to_self_pathid, output);
515                        }
516                        for clause in &mut func.where_clause {
517                            for entry in clause {
518                                map_fn_sig_item(&map_other_pathid_to_self_pathid, entry);
519                            }
520                        }
521                        func
522                    }),
523                    other.type_data[other_entryid].as_ref().map(|type_data| TypeData {
524                        inverted_function_inputs_index: type_data
525                            .inverted_function_inputs_index
526                            .iter()
527                            .cloned()
528                            .map(|mut list| {
529                                for fnid in &mut list {
530                                    assert!(
531                                        other.function_data[usize::try_from(*fnid).unwrap()]
532                                            .is_some(),
533                                    );
534                                    // this is valid because we call `self.push()` once, exactly, for every entry,
535                                    // even if we're just pushing a tombstone
536                                    *fnid += u32::try_from(other_entryid_offset).unwrap();
537                                }
538                                list
539                            })
540                            .collect(),
541                        inverted_function_output_index: type_data
542                            .inverted_function_output_index
543                            .iter()
544                            .cloned()
545                            .map(|mut list| {
546                                for fnid in &mut list {
547                                    assert!(
548                                        other.function_data[usize::try_from(*fnid).unwrap()]
549                                            .is_some(),
550                                    );
551                                    // this is valid because we call `self.push()` once, exactly, for every entry,
552                                    // even if we're just pushing a tombstone
553                                    *fnid += u32::try_from(other_entryid_offset).unwrap();
554                                }
555                                list
556                            })
557                            .collect(),
558                        search_unbox: type_data.search_unbox,
559                    }),
560                    other.alias_pointers[other_entryid]
561                        .map(|alias_pointer| alias_pointer + other_entryid_offset),
562                );
563            }
564        }
565        if other.generic_inverted_index.len() > self.generic_inverted_index.len() {
566            self.generic_inverted_index.resize(other.generic_inverted_index.len(), Vec::new());
567        }
568        for (other_generic_inverted_index, self_generic_inverted_index) in
569            iter::zip(&other.generic_inverted_index, &mut self.generic_inverted_index)
570        {
571            if other_generic_inverted_index.len() > self_generic_inverted_index.len() {
572                self_generic_inverted_index.resize(other_generic_inverted_index.len(), Vec::new());
573            }
574            for (other_list, self_list) in
575                iter::zip(other_generic_inverted_index, self_generic_inverted_index)
576            {
577                self_list.extend(
578                    other_list
579                        .iter()
580                        .copied()
581                        .map(|fnid| fnid + u32::try_from(other_entryid_offset).unwrap()),
582                );
583            }
584        }
585        self
586    }
587
588    pub(crate) fn sort(self) -> SerializedSearchIndex {
589        let mut idlist: Vec<usize> = (0..self.names.len()).collect();
590        // nameless entries are tombstones, and will be removed after sorting
591        // sort shorter names first, so that we can present them in order out of search.js
592        idlist.sort_by_key(|&id| {
593            (
594                self.names[id].is_empty(),
595                self.names[id].len(),
596                &self.names[id],
597                self.entry_data[id].as_ref().map_or("", |entry| self.names[entry.krate].as_str()),
598                self.path_data[id].as_ref().map_or(&[][..], |entry| &entry.module_path[..]),
599            )
600        });
601        let map = FxHashMap::from_iter(
602            idlist.iter().enumerate().map(|(new_id, &old_id)| (old_id, new_id)),
603        );
604        let mut new = SerializedSearchIndex::default();
605        for &id in &idlist {
606            if self.names[id].is_empty() {
607                break;
608            }
609            new.push(
610                self.names[id].clone(),
611                self.path_data[id].clone(),
612                self.entry_data[id].as_ref().map(
613                    |EntryData {
614                         krate,
615                         ty,
616                         module_path,
617                         exact_module_path,
618                         parent,
619                         trait_parent,
620                         deprecated,
621                         unstable,
622                         associated_item_disambiguator_or_extern_crate_url:
623                             associated_item_disambiguator,
624                     }| EntryData {
625                        krate: *map.get(krate).unwrap(),
626                        ty: *ty,
627                        module_path: module_path.and_then(|path_id| map.get(&path_id).copied()),
628                        exact_module_path: exact_module_path
629                            .and_then(|path_id| map.get(&path_id).copied()),
630                        parent: parent.and_then(|path_id| map.get(&path_id).copied()),
631                        trait_parent: trait_parent.and_then(|path_id| map.get(&path_id).copied()),
632                        deprecated: *deprecated,
633                        unstable: *unstable,
634                        associated_item_disambiguator_or_extern_crate_url:
635                            associated_item_disambiguator.clone(),
636                    },
637                ),
638                self.descs[id].clone(),
639                self.function_data[id].clone().map(|mut func| {
640                    fn map_fn_sig_item(map: &FxHashMap<usize, usize>, ty: &mut RenderType) {
641                        match ty.id {
642                            None => {}
643                            Some(RenderTypeId::Index(generic)) if generic < 0 => {}
644                            Some(RenderTypeId::Index(id)) => {
645                                let id = usize::try_from(id).unwrap();
646                                let id = *map.get(&id).unwrap();
647                                assert!(id != !0);
648                                ty.id = Some(RenderTypeId::Index(isize::try_from(id).unwrap()));
649                            }
650                            _ => unreachable!(),
651                        }
652                        if let Some(generics) = &mut ty.generics {
653                            for generic in generics {
654                                map_fn_sig_item(map, generic);
655                            }
656                        }
657                        if let Some(bindings) = &mut ty.bindings {
658                            for (param, constraints) in bindings {
659                                *param = match *param {
660                                    param @ RenderTypeId::Index(generic) if generic < 0 => param,
661                                    RenderTypeId::Index(id) => {
662                                        let id = usize::try_from(id).unwrap();
663                                        let id = *map.get(&id).unwrap();
664                                        assert!(id != !0);
665                                        RenderTypeId::Index(isize::try_from(id).unwrap())
666                                    }
667                                    _ => unreachable!(),
668                                };
669                                for constraint in constraints {
670                                    map_fn_sig_item(map, constraint);
671                                }
672                            }
673                        }
674                    }
675                    for input in &mut func.inputs {
676                        map_fn_sig_item(&map, input);
677                    }
678                    for output in &mut func.output {
679                        map_fn_sig_item(&map, output);
680                    }
681                    for clause in &mut func.where_clause {
682                        for entry in clause {
683                            map_fn_sig_item(&map, entry);
684                        }
685                    }
686                    func
687                }),
688                self.type_data[id].as_ref().map(
689                    |TypeData {
690                         search_unbox,
691                         inverted_function_inputs_index,
692                         inverted_function_output_index,
693                     }| {
694                        let inverted_function_inputs_index: Vec<Vec<u32>> =
695                            inverted_function_inputs_index
696                                .iter()
697                                .cloned()
698                                .map(|mut list| {
699                                    for id in &mut list {
700                                        *id = u32::try_from(
701                                            *map.get(&usize::try_from(*id).unwrap()).unwrap(),
702                                        )
703                                        .unwrap();
704                                    }
705                                    list.sort();
706                                    list
707                                })
708                                .collect();
709                        let inverted_function_output_index: Vec<Vec<u32>> =
710                            inverted_function_output_index
711                                .iter()
712                                .cloned()
713                                .map(|mut list| {
714                                    for id in &mut list {
715                                        *id = u32::try_from(
716                                            *map.get(&usize::try_from(*id).unwrap()).unwrap(),
717                                        )
718                                        .unwrap();
719                                    }
720                                    list.sort();
721                                    list
722                                })
723                                .collect();
724                        TypeData {
725                            search_unbox: *search_unbox,
726                            inverted_function_inputs_index,
727                            inverted_function_output_index,
728                        }
729                    },
730                ),
731                self.alias_pointers[id].and_then(|alias| {
732                    if self.names[alias].is_empty() { None } else { map.get(&alias).copied() }
733                }),
734            );
735        }
736        new.generic_inverted_index = self
737            .generic_inverted_index
738            .into_iter()
739            .map(|mut postings| {
740                for list in postings.iter_mut() {
741                    let mut new_list: Vec<u32> = list
742                        .iter()
743                        .copied()
744                        .filter_map(|id| u32::try_from(*map.get(&usize::try_from(id).ok()?)?).ok())
745                        .collect();
746                    new_list.sort();
747                    *list = new_list;
748                }
749                postings
750            })
751            .collect();
752        new
753    }
754
755    pub(crate) fn write_to(self, doc_root: &Path, resource_suffix: &str) -> Result<(), Error> {
756        let SerializedSearchIndex {
757            names,
758            path_data,
759            entry_data,
760            descs,
761            function_data,
762            type_data,
763            alias_pointers,
764            generic_inverted_index,
765            crate_paths_index: _,
766        } = self;
767        let mut serialized_root = Vec::new();
768        serialized_root.extend_from_slice(br#"rr_('{"normalizedName":{"I":""#);
769        let normalized_names = names
770            .iter()
771            .map(|name| {
772                if name.contains("_") {
773                    name.replace("_", "").to_ascii_lowercase()
774                } else {
775                    name.to_ascii_lowercase()
776                }
777            })
778            .collect::<Vec<String>>();
779        let names_search_tree = stringdex_internals::tree::encode_search_tree_ukkonen(
780            normalized_names.iter().map(|name| name.as_bytes()),
781        );
782        let dir_path = doc_root.join(format!("search.index/"));
783        let _ = std::fs::remove_dir_all(&dir_path); // if already missing, no problem
784        stringdex_internals::write_tree_to_disk(
785            &names_search_tree,
786            &dir_path,
787            &mut serialized_root,
788        )
789        .map_err(|error| Error {
790            file: dir_path,
791            error: format!("failed to write name tree to disk: {error}"),
792        })?;
793        std::mem::drop(names_search_tree);
794        serialized_root.extend_from_slice(br#"","#);
795        serialized_root.extend_from_slice(&perform_write_strings(
796            doc_root,
797            "normalizedName",
798            normalized_names.into_iter(),
799        )?);
800        serialized_root.extend_from_slice(br#"},"crateNames":{"#);
801        let mut crates: Vec<&[u8]> = entry_data
802            .iter()
803            .filter_map(|entry_data| Some(names[entry_data.as_ref()?.krate].as_bytes()))
804            .collect();
805        crates.sort();
806        crates.dedup();
807        serialized_root.extend_from_slice(&perform_write_strings(
808            doc_root,
809            "crateNames",
810            crates.into_iter(),
811        )?);
812        serialized_root.extend_from_slice(br#"},"name":{"#);
813        serialized_root.extend_from_slice(&perform_write_strings(doc_root, "name", names.iter())?);
814        serialized_root.extend_from_slice(br#"},"path":{"#);
815        serialized_root.extend_from_slice(&perform_write_serde(doc_root, "path", path_data)?);
816        serialized_root.extend_from_slice(br#"},"entry":{"#);
817        serialized_root.extend_from_slice(&perform_write_serde(doc_root, "entry", entry_data)?);
818        serialized_root.extend_from_slice(br#"},"desc":{"#);
819        serialized_root.extend_from_slice(&perform_write_strings(
820            doc_root,
821            "desc",
822            descs.into_iter(),
823        )?);
824        serialized_root.extend_from_slice(br#"},"function":{"#);
825        serialized_root.extend_from_slice(&perform_write_serde(
826            doc_root,
827            "function",
828            function_data,
829        )?);
830        serialized_root.extend_from_slice(br#"},"type":{"#);
831        serialized_root.extend_from_slice(&perform_write_serde(doc_root, "type", type_data)?);
832        serialized_root.extend_from_slice(br#"},"alias":{"#);
833        serialized_root.extend_from_slice(&perform_write_serde(doc_root, "alias", alias_pointers)?);
834        serialized_root.extend_from_slice(br#"},"generic_inverted_index":{"#);
835        serialized_root.extend_from_slice(&perform_write_postings(
836            doc_root,
837            "generic_inverted_index",
838            generic_inverted_index,
839        )?);
840        serialized_root.extend_from_slice(br#"}}')"#);
841        fn perform_write_strings(
842            doc_root: &Path,
843            dirname: &str,
844            mut column: impl Iterator<Item = impl AsRef<[u8]> + Clone> + ExactSizeIterator,
845        ) -> Result<Vec<u8>, Error> {
846            let dir_path = doc_root.join(format!("search.index/{dirname}"));
847            stringdex_internals::write_data_to_disk(&mut column, &dir_path).map_err(|error| Error {
848                file: dir_path,
849                error: format!("failed to write column to disk: {error}"),
850            })
851        }
852        fn perform_write_serde(
853            doc_root: &Path,
854            dirname: &str,
855            column: Vec<Option<impl Serialize>>,
856        ) -> Result<Vec<u8>, Error> {
857            perform_write_strings(
858                doc_root,
859                dirname,
860                column.into_iter().map(|value| {
861                    if let Some(value) = value {
862                        serde_json::to_vec(&value).unwrap()
863                    } else {
864                        Vec::new()
865                    }
866                }),
867            )
868        }
869        fn perform_write_postings(
870            doc_root: &Path,
871            dirname: &str,
872            column: Vec<Vec<Vec<u32>>>,
873        ) -> Result<Vec<u8>, Error> {
874            perform_write_strings(
875                doc_root,
876                dirname,
877                column.into_iter().map(|postings| {
878                    let mut buf = Vec::new();
879                    encode::write_postings_to_string(&postings, &mut buf);
880                    buf
881                }),
882            )
883        }
884        std::fs::write(
885            doc_root.join(format!("search.index/root{resource_suffix}.js")),
886            serialized_root,
887        )
888        .map_err(|error| Error {
889            file: doc_root.join(format!("search.index/root{resource_suffix}.js")),
890            error: format!("failed to write root to disk: {error}"),
891        })?;
892        Ok(())
893    }
894}
895
896#[derive(Clone, Debug)]
897struct EntryData {
898    krate: usize,
899    ty: ItemType,
900    module_path: Option<usize>,
901    exact_module_path: Option<usize>,
902    parent: Option<usize>,
903    trait_parent: Option<usize>,
904    deprecated: bool,
905    unstable: bool,
906    associated_item_disambiguator_or_extern_crate_url: Option<String>,
907}
908
909impl Serialize for EntryData {
910    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
911    where
912        S: Serializer,
913    {
914        let mut seq = serializer.serialize_seq(None)?;
915        seq.serialize_element(&self.krate)?;
916        seq.serialize_element(&self.ty)?;
917        seq.serialize_element(&self.module_path.map(|id| id + 1).unwrap_or(0))?;
918        seq.serialize_element(&self.exact_module_path.map(|id| id + 1).unwrap_or(0))?;
919        seq.serialize_element(&self.parent.map(|id| id + 1).unwrap_or(0))?;
920        seq.serialize_element(&self.trait_parent.map(|id| id + 1).unwrap_or(0))?;
921        seq.serialize_element(&if self.deprecated { 1 } else { 0 })?;
922        seq.serialize_element(&if self.unstable { 1 } else { 0 })?;
923        if let Some(disambig) = &self.associated_item_disambiguator_or_extern_crate_url {
924            seq.serialize_element(&disambig)?;
925        }
926        seq.end()
927    }
928}
929
930impl<'de> Deserialize<'de> for EntryData {
931    fn deserialize<D>(deserializer: D) -> Result<EntryData, D::Error>
932    where
933        D: Deserializer<'de>,
934    {
935        struct EntryDataVisitor;
936        impl<'de> de::Visitor<'de> for EntryDataVisitor {
937            type Value = EntryData;
938            fn expecting(&self, formatter: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
939                write!(formatter, "path data")
940            }
941            fn visit_seq<A: de::SeqAccess<'de>>(self, mut v: A) -> Result<EntryData, A::Error> {
942                let krate: usize =
943                    v.next_element()?.ok_or_else(|| A::Error::missing_field("krate"))?;
944                let ty: ItemType =
945                    v.next_element()?.ok_or_else(|| A::Error::missing_field("ty"))?;
946                let module_path: SerializedOptional32 =
947                    v.next_element()?.ok_or_else(|| A::Error::missing_field("module_path"))?;
948                let exact_module_path: SerializedOptional32 = v
949                    .next_element()?
950                    .ok_or_else(|| A::Error::missing_field("exact_module_path"))?;
951                let parent: SerializedOptional32 =
952                    v.next_element()?.ok_or_else(|| A::Error::missing_field("parent"))?;
953                let trait_parent: SerializedOptional32 =
954                    v.next_element()?.ok_or_else(|| A::Error::missing_field("trait_parent"))?;
955
956                let deprecated: u32 = v.next_element()?.unwrap_or(0);
957                let unstable: u32 = v.next_element()?.unwrap_or(0);
958                let associated_item_disambiguator: Option<String> = v.next_element()?;
959                Ok(EntryData {
960                    krate,
961                    ty,
962                    module_path: Option::<i32>::from(module_path).map(|path| path as usize),
963                    exact_module_path: Option::<i32>::from(exact_module_path)
964                        .map(|path| path as usize),
965                    parent: Option::<i32>::from(parent).map(|path| path as usize),
966                    trait_parent: Option::<i32>::from(trait_parent).map(|path| path as usize),
967                    deprecated: deprecated != 0,
968                    unstable: unstable != 0,
969                    associated_item_disambiguator_or_extern_crate_url:
970                        associated_item_disambiguator,
971                })
972            }
973        }
974        deserializer.deserialize_any(EntryDataVisitor)
975    }
976}
977
978#[derive(Clone, Debug)]
979struct PathData {
980    ty: ItemType,
981    module_path: Vec<Symbol>,
982    exact_module_path: Option<Vec<Symbol>>,
983}
984
985impl Serialize for PathData {
986    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
987    where
988        S: Serializer,
989    {
990        let mut seq = serializer.serialize_seq(None)?;
991        seq.serialize_element(&self.ty)?;
992        seq.serialize_element(&if self.module_path.is_empty() {
993            String::new()
994        } else {
995            join_path_syms(&self.module_path)
996        })?;
997        if let Some(ref path) = self.exact_module_path {
998            seq.serialize_element(&if path.is_empty() {
999                String::new()
1000            } else {
1001                join_path_syms(path)
1002            })?;
1003        }
1004        seq.end()
1005    }
1006}
1007
1008impl<'de> Deserialize<'de> for PathData {
1009    fn deserialize<D>(deserializer: D) -> Result<PathData, D::Error>
1010    where
1011        D: Deserializer<'de>,
1012    {
1013        struct PathDataVisitor;
1014        impl<'de> de::Visitor<'de> for PathDataVisitor {
1015            type Value = PathData;
1016            fn expecting(&self, formatter: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
1017                write!(formatter, "path data")
1018            }
1019            fn visit_seq<A: de::SeqAccess<'de>>(self, mut v: A) -> Result<PathData, A::Error> {
1020                let ty: ItemType =
1021                    v.next_element()?.ok_or_else(|| A::Error::missing_field("ty"))?;
1022                let module_path: String =
1023                    v.next_element()?.ok_or_else(|| A::Error::missing_field("module_path"))?;
1024                let exact_module_path: Option<String> =
1025                    v.next_element()?.and_then(SerializedOptionalString::into);
1026                Ok(PathData {
1027                    ty,
1028                    module_path: if module_path.is_empty() {
1029                        vec![]
1030                    } else {
1031                        module_path.split("::").map(Symbol::intern).collect()
1032                    },
1033                    exact_module_path: exact_module_path.map(|path| {
1034                        if path.is_empty() {
1035                            vec![]
1036                        } else {
1037                            path.split("::").map(Symbol::intern).collect()
1038                        }
1039                    }),
1040                })
1041            }
1042        }
1043        deserializer.deserialize_any(PathDataVisitor)
1044    }
1045}
1046
1047#[derive(Clone, Debug)]
1048struct TypeData {
1049    /// If set to "true", the generics can be matched without having to
1050    /// mention the type itself. The truth table, assuming `Unboxable`
1051    /// has `search_unbox = true` and `Inner` has `search_unbox = false`
1052    ///
1053    /// | **query**          | `Unboxable<Inner>` | `Inner` | `Inner<Unboxable>` |
1054    /// |--------------------|--------------------|---------|--------------------|
1055    /// | `Inner`            | yes                | yes     | yes                |
1056    /// | `Unboxable`        | yes                | no      | no                 |
1057    /// | `Unboxable<Inner>` | yes                | no      | no                 |
1058    /// | `Inner<Unboxable>` | no                 | no      | yes                |
1059    search_unbox: bool,
1060    /// List of functions that mention this type in their type signature,
1061    /// on the left side of the `->` arrow.
1062    ///
1063    /// - The outer layer is sorted by number of types that appear in the
1064    ///   type signature. The search engine iterates over these in order from
1065    ///   smallest to largest. Functions with less stuff in their type
1066    ///   signature are more likely to be what the user wants, because we never
1067    ///   show functions that are *missing* parts of the query, so removing..
1068    ///
1069    /// - The inner layer is the list of functions.
1070    inverted_function_inputs_index: Vec<Vec<u32>>,
1071    /// List of functions that mention this type in their type signature,
1072    /// on the right side of the `->` arrow.
1073    inverted_function_output_index: Vec<Vec<u32>>,
1074}
1075
1076impl Serialize for TypeData {
1077    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
1078    where
1079        S: Serializer,
1080    {
1081        let mut seq = serializer.serialize_seq(None)?;
1082        let mut buf = Vec::new();
1083        encode::write_postings_to_string(&self.inverted_function_inputs_index, &mut buf);
1084        let mut serialized_result = Vec::new();
1085        stringdex_internals::encode::write_base64_to_bytes(&buf, &mut serialized_result).unwrap();
1086        seq.serialize_element(&str::from_utf8(&serialized_result).unwrap())?;
1087        buf.clear();
1088        serialized_result.clear();
1089        encode::write_postings_to_string(&self.inverted_function_output_index, &mut buf);
1090        stringdex_internals::encode::write_base64_to_bytes(&buf, &mut serialized_result).unwrap();
1091        seq.serialize_element(&str::from_utf8(&serialized_result).unwrap())?;
1092        if self.search_unbox {
1093            seq.serialize_element(&1)?;
1094        }
1095        seq.end()
1096    }
1097}
1098
1099impl<'de> Deserialize<'de> for TypeData {
1100    fn deserialize<D>(deserializer: D) -> Result<TypeData, D::Error>
1101    where
1102        D: Deserializer<'de>,
1103    {
1104        struct TypeDataVisitor;
1105        impl<'de> de::Visitor<'de> for TypeDataVisitor {
1106            type Value = TypeData;
1107            fn expecting(&self, formatter: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
1108                write!(formatter, "type data")
1109            }
1110            fn visit_none<E>(self) -> Result<TypeData, E> {
1111                Ok(TypeData {
1112                    inverted_function_inputs_index: vec![],
1113                    inverted_function_output_index: vec![],
1114                    search_unbox: false,
1115                })
1116            }
1117            fn visit_seq<A: de::SeqAccess<'de>>(self, mut v: A) -> Result<TypeData, A::Error> {
1118                let inverted_function_inputs_index: String =
1119                    v.next_element()?.unwrap_or(String::new());
1120                let inverted_function_output_index: String =
1121                    v.next_element()?.unwrap_or(String::new());
1122                let search_unbox: u32 = v.next_element()?.unwrap_or(0);
1123                let mut idx: Vec<u8> = Vec::new();
1124                stringdex_internals::decode::read_base64_from_bytes(
1125                    inverted_function_inputs_index.as_bytes(),
1126                    &mut idx,
1127                )
1128                .unwrap();
1129                let mut inverted_function_inputs_index = Vec::new();
1130                encode::read_postings_from_string(&mut inverted_function_inputs_index, &idx);
1131                idx.clear();
1132                stringdex_internals::decode::read_base64_from_bytes(
1133                    inverted_function_output_index.as_bytes(),
1134                    &mut idx,
1135                )
1136                .unwrap();
1137                let mut inverted_function_output_index = Vec::new();
1138                encode::read_postings_from_string(&mut inverted_function_output_index, &idx);
1139                Ok(TypeData {
1140                    inverted_function_inputs_index,
1141                    inverted_function_output_index,
1142                    search_unbox: search_unbox == 1,
1143                })
1144            }
1145        }
1146        deserializer.deserialize_any(TypeDataVisitor)
1147    }
1148}
1149
1150enum SerializedOptionalString {
1151    None,
1152    Some(String),
1153}
1154
1155impl From<SerializedOptionalString> for Option<String> {
1156    fn from(me: SerializedOptionalString) -> Option<String> {
1157        match me {
1158            SerializedOptionalString::Some(string) => Some(string),
1159            SerializedOptionalString::None => None,
1160        }
1161    }
1162}
1163
1164impl Serialize for SerializedOptionalString {
1165    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
1166    where
1167        S: Serializer,
1168    {
1169        match self {
1170            SerializedOptionalString::Some(string) => string.serialize(serializer),
1171            SerializedOptionalString::None => 0.serialize(serializer),
1172        }
1173    }
1174}
1175impl<'de> Deserialize<'de> for SerializedOptionalString {
1176    fn deserialize<D>(deserializer: D) -> Result<SerializedOptionalString, D::Error>
1177    where
1178        D: Deserializer<'de>,
1179    {
1180        struct SerializedOptionalStringVisitor;
1181        impl<'de> de::Visitor<'de> for SerializedOptionalStringVisitor {
1182            type Value = SerializedOptionalString;
1183            fn expecting(&self, formatter: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
1184                write!(formatter, "0 or string")
1185            }
1186            fn visit_u64<E: de::Error>(self, v: u64) -> Result<SerializedOptionalString, E> {
1187                if v != 0 {
1188                    return Err(E::missing_field("not 0"));
1189                }
1190                Ok(SerializedOptionalString::None)
1191            }
1192            fn visit_string<E: de::Error>(self, v: String) -> Result<SerializedOptionalString, E> {
1193                Ok(SerializedOptionalString::Some(v))
1194            }
1195            fn visit_str<E: de::Error>(self, v: &str) -> Result<SerializedOptionalString, E> {
1196                Ok(SerializedOptionalString::Some(v.to_string()))
1197            }
1198        }
1199        deserializer.deserialize_any(SerializedOptionalStringVisitor)
1200    }
1201}
1202
1203enum SerializedOptional32 {
1204    None,
1205    Some(i32),
1206}
1207
1208impl From<SerializedOptional32> for Option<i32> {
1209    fn from(me: SerializedOptional32) -> Option<i32> {
1210        match me {
1211            SerializedOptional32::Some(number) => Some(number),
1212            SerializedOptional32::None => None,
1213        }
1214    }
1215}
1216
1217impl Serialize for SerializedOptional32 {
1218    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
1219    where
1220        S: Serializer,
1221    {
1222        match self {
1223            &SerializedOptional32::Some(number) if number < 0 => number.serialize(serializer),
1224            &SerializedOptional32::Some(number) => (number + 1).serialize(serializer),
1225            &SerializedOptional32::None => 0.serialize(serializer),
1226        }
1227    }
1228}
1229impl<'de> Deserialize<'de> for SerializedOptional32 {
1230    fn deserialize<D>(deserializer: D) -> Result<SerializedOptional32, D::Error>
1231    where
1232        D: Deserializer<'de>,
1233    {
1234        struct SerializedOptional32Visitor;
1235        impl<'de> de::Visitor<'de> for SerializedOptional32Visitor {
1236            type Value = SerializedOptional32;
1237            fn expecting(&self, formatter: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
1238                write!(formatter, "integer")
1239            }
1240            fn visit_i64<E: de::Error>(self, v: i64) -> Result<SerializedOptional32, E> {
1241                Ok(match v {
1242                    0 => SerializedOptional32::None,
1243                    v if v < 0 => SerializedOptional32::Some(v as i32),
1244                    v => SerializedOptional32::Some(v as i32 - 1),
1245                })
1246            }
1247            fn visit_u64<E: de::Error>(self, v: u64) -> Result<SerializedOptional32, E> {
1248                Ok(match v {
1249                    0 => SerializedOptional32::None,
1250                    v => SerializedOptional32::Some(v as i32 - 1),
1251                })
1252            }
1253        }
1254        deserializer.deserialize_any(SerializedOptional32Visitor)
1255    }
1256}
1257
1258/// Builds the search index from the collected metadata
1259pub(crate) fn build_index(
1260    krate: &clean::Crate,
1261    cache: &mut Cache,
1262    tcx: TyCtxt<'_>,
1263    doc_root: &Path,
1264    resource_suffix: &str,
1265    should_merge: &ShouldMerge,
1266) -> Result<SerializedSearchIndex, Error> {
1267    let mut search_index = std::mem::take(&mut cache.search_index);
1268
1269    // Attach all orphan items to the type's definition if the type
1270    // has since been learned.
1271    for &OrphanImplItem { impl_id, parent, trait_parent, ref item, ref impl_generics } in
1272        &cache.orphan_impl_items
1273    {
1274        if let Some((fqp, _)) = cache.paths.get(&parent) {
1275            let info = IndexItemInfo::new(tcx, cache, item, Some(parent), impl_generics.as_ref());
1276            search_index.push(IndexItem {
1277                defid: item.item_id.as_def_id(),
1278                name: item.name.unwrap(),
1279                module_path: fqp[..fqp.len() - 1].to_vec(),
1280                parent: Some(parent),
1281                parent_idx: None,
1282                trait_parent,
1283                trait_parent_idx: None,
1284                exact_module_path: None,
1285                impl_id,
1286                info,
1287            });
1288        }
1289    }
1290
1291    // Sort search index items. This improves the compressibility of the search index.
1292    search_index.sort_unstable_by(|k1, k2| {
1293        // `sort_unstable_by_key` produces lifetime errors
1294        // HACK(rustdoc): should not be sorting `CrateNum` or `DefIndex`, this will soon go away, too
1295        fn key(i: &IndexItem) -> (&[Symbol], &str, ItemType, Option<(DefIndex, CrateNum)>) {
1296            (&i.module_path, i.name.as_str(), i.info.ty, i.parent.map(|id| (id.index, id.krate)))
1297        }
1298        Ord::cmp(&key(k1), &key(k2))
1299    });
1300
1301    // Now, convert to an on-disk search index format
1302    //
1303    // if there's already a search index, load it into memory and add the new entries to it
1304    // otherwise, do nothing
1305    let mut serialized_index = if should_merge.read_rendered_cci {
1306        SerializedSearchIndex::load(doc_root, resource_suffix)?
1307    } else {
1308        SerializedSearchIndex::default()
1309    };
1310
1311    // The crate always goes first in this list
1312    let crate_name = krate.name(tcx);
1313    let crate_doc =
1314        short_markdown_summary(&krate.module.doc_value(), &krate.module.link_names(cache));
1315    let crate_idx = {
1316        let crate_path = (ItemType::ExternCrate, vec![crate_name]);
1317        match serialized_index.crate_paths_index.entry(crate_path) {
1318            Entry::Occupied(index) => {
1319                let index = *index.get();
1320                serialized_index.descs[index] = crate_doc;
1321                for type_data in serialized_index.type_data.iter_mut() {
1322                    if let Some(TypeData {
1323                        inverted_function_inputs_index,
1324                        inverted_function_output_index,
1325                        ..
1326                    }) = type_data
1327                    {
1328                        for list in inverted_function_inputs_index
1329                            .iter_mut()
1330                            .chain(inverted_function_output_index.iter_mut())
1331                        {
1332                            list.retain(|fnid| {
1333                                serialized_index.entry_data[usize::try_from(*fnid).unwrap()]
1334                                    .as_ref()
1335                                    .unwrap()
1336                                    .krate
1337                                    != index
1338                            });
1339                        }
1340                    }
1341                }
1342                for i in (index + 1)..serialized_index.entry_data.len() {
1343                    // if this crate has been built before, replace its stuff with new
1344                    if let Some(EntryData { krate, .. }) = serialized_index.entry_data[i]
1345                        && krate == index
1346                    {
1347                        serialized_index.entry_data[i] = None;
1348                        serialized_index.descs[i] = String::new();
1349                        serialized_index.function_data[i] = None;
1350                        if serialized_index.path_data[i].is_none() {
1351                            serialized_index.names[i] = String::new();
1352                        }
1353                    }
1354                    if let Some(alias_pointer) = serialized_index.alias_pointers[i]
1355                        && serialized_index.entry_data[alias_pointer].is_none()
1356                    {
1357                        serialized_index.alias_pointers[i] = None;
1358                        if serialized_index.path_data[i].is_none()
1359                            && serialized_index.entry_data[i].is_none()
1360                        {
1361                            serialized_index.names[i] = String::new();
1362                        }
1363                    }
1364                }
1365                index
1366            }
1367            Entry::Vacant(slot) => {
1368                let krate = serialized_index.names.len();
1369                slot.insert(krate);
1370                serialized_index.push(
1371                    crate_name.as_str().to_string(),
1372                    Some(PathData {
1373                        ty: ItemType::ExternCrate,
1374                        module_path: vec![],
1375                        exact_module_path: None,
1376                    }),
1377                    Some(EntryData {
1378                        krate,
1379                        ty: ItemType::ExternCrate,
1380                        module_path: None,
1381                        exact_module_path: None,
1382                        parent: None,
1383                        trait_parent: None,
1384                        deprecated: false,
1385                        unstable: false,
1386                        associated_item_disambiguator_or_extern_crate_url: None,
1387                    }),
1388                    crate_doc,
1389                    None,
1390                    None,
1391                    None,
1392                );
1393                krate
1394            }
1395        }
1396    };
1397
1398    // First, populate associated item parents and trait parents
1399    let crate_items: Vec<&mut IndexItem> = search_index
1400        .iter_mut()
1401        .map(|item| {
1402            let mut defid_to_rowid = |defid, check_external: bool| {
1403                cache
1404                    .paths
1405                    .get(&defid)
1406                    .or_else(|| check_external.then(|| cache.external_paths.get(&defid)).flatten())
1407                    .map(|&(ref fqp, ty)| {
1408                        let pathid = serialized_index.names.len();
1409                        match serialized_index.crate_paths_index.entry((ty, fqp.clone())) {
1410                            Entry::Occupied(entry) => *entry.get(),
1411                            Entry::Vacant(entry) => {
1412                                entry.insert(pathid);
1413                                let (name, path) = fqp.split_last().unwrap();
1414                                serialized_index.push_path(
1415                                    name.as_str().to_string(),
1416                                    PathData {
1417                                        ty,
1418                                        module_path: path.to_vec(),
1419                                        exact_module_path: if let Some(exact_path) =
1420                                            cache.exact_paths.get(&defid)
1421                                            && let Some((name2, exact_path)) =
1422                                                exact_path.split_last()
1423                                            && name == name2
1424                                        {
1425                                            Some(exact_path.to_vec())
1426                                        } else {
1427                                            None
1428                                        },
1429                                    },
1430                                );
1431                                usize::try_from(pathid).unwrap()
1432                            }
1433                        }
1434                    })
1435            };
1436            item.parent_idx = item.parent.and_then(|p| defid_to_rowid(p, false));
1437            item.trait_parent_idx = item.trait_parent.and_then(|p| defid_to_rowid(p, true));
1438
1439            if let Some(defid) = item.defid
1440                && item.parent_idx.is_none()
1441            {
1442                // If this is a re-export, retain the original path.
1443                // Associated items don't use this.
1444                // Their parent carries the exact fqp instead.
1445                let exact_fqp = cache
1446                    .exact_paths
1447                    .get(&defid)
1448                    .or_else(|| cache.external_paths.get(&defid).map(|(fqp, _)| fqp));
1449                item.exact_module_path = exact_fqp.and_then(|fqp| {
1450                    // Re-exports only count if the name is exactly the same.
1451                    // This is a size optimization, since it means we only need
1452                    // to store the name once (and the path is re-used for everything
1453                    // exported from this same module). It's also likely to Do
1454                    // What I Mean, since if a re-export changes the name, it might
1455                    // also be a change in semantic meaning.
1456                    if fqp.last() != Some(&item.name) {
1457                        return None;
1458                    }
1459                    let path = if item.info.ty == ItemType::Macro
1460                        && find_attr!(tcx, defid, MacroExport { .. })
1461                    {
1462                        // `#[macro_export]` always exports to the crate root.
1463                        vec![tcx.crate_name(defid.krate)]
1464                    } else {
1465                        if fqp.len() < 2 {
1466                            return None;
1467                        }
1468                        fqp[..fqp.len() - 1].to_vec()
1469                    };
1470                    if path == item.module_path {
1471                        return None;
1472                    }
1473                    Some(path)
1474                });
1475            } else if let Some(parent_idx) = item.parent_idx {
1476                let i = usize::try_from(parent_idx).unwrap();
1477                item.module_path =
1478                    serialized_index.path_data[i].as_ref().unwrap().module_path.clone();
1479                item.exact_module_path =
1480                    serialized_index.path_data[i].as_ref().unwrap().exact_module_path.clone();
1481            }
1482
1483            &mut *item
1484        })
1485        .collect();
1486
1487    // Now, find anywhere that the same name is used for two different items
1488    // these need a disambiguator hash for lints
1489    let mut associated_item_duplicates = FxHashMap::<(usize, ItemType, Symbol), usize>::default();
1490    for item in crate_items.iter().map(|x| &*x) {
1491        if item.impl_id.is_some()
1492            && let Some(parent_idx) = item.parent_idx
1493        {
1494            let count = associated_item_duplicates
1495                .entry((parent_idx, item.info.ty, item.name))
1496                .or_insert(0);
1497            *count += 1;
1498        }
1499    }
1500
1501    // now populate the actual entries, type data, and function data
1502    for item in crate_items {
1503        assert_eq!(
1504            item.parent.is_some(),
1505            item.parent_idx.is_some(),
1506            "`{}` is missing idx",
1507            item.name
1508        );
1509
1510        let module_path = Some(serialized_index.get_id_by_module_path(&item.module_path));
1511        let exact_module_path = item
1512            .exact_module_path
1513            .as_ref()
1514            .map(|path| serialized_index.get_id_by_module_path(path));
1515
1516        let new_entry_id = serialized_index.add_entry(
1517            item.name,
1518            EntryData {
1519                ty: item.info.ty,
1520                parent: item.parent_idx,
1521                trait_parent: item.trait_parent_idx,
1522                module_path,
1523                exact_module_path,
1524                deprecated: item
1525                    .info
1526                    .deprecation
1527                    .is_some_and(|deprecation| deprecation.is_in_effect()),
1528                unstable: item.info.is_unstable,
1529                associated_item_disambiguator_or_extern_crate_url: if let Some(impl_id) =
1530                    item.impl_id
1531                    && let Some(parent_idx) = item.parent_idx
1532                    && associated_item_duplicates
1533                        .get(&(parent_idx, item.info.ty, item.name))
1534                        .copied()
1535                        .unwrap_or(0)
1536                        > 1
1537                {
1538                    Some(render::get_id_for_impl(tcx, ItemId::DefId(impl_id)))
1539                } else if item.info.ty == ItemType::ExternCrate
1540                    && let Some(local_def_id) = item.defid.and_then(|def_id| def_id.as_local())
1541                    && let cnum = tcx.extern_mod_stmt_cnum(local_def_id).unwrap_or(LOCAL_CRATE)
1542                    && let Some(ExternalLocation::Remote { url, is_absolute }) =
1543                        cache.extern_locations.get(&cnum)
1544                    && *is_absolute
1545                {
1546                    Some(format!("{}{}", url, tcx.crate_name(cnum).as_str()))
1547                } else {
1548                    None
1549                },
1550                krate: crate_idx,
1551            },
1552            item.info.desc.to_string(),
1553        );
1554
1555        // Aliases
1556        // -------
1557        for alias in &item.info.aliases {
1558            serialized_index.push_alias(alias.as_str().to_string(), new_entry_id);
1559        }
1560
1561        // Function signature reverse index
1562        // --------------------------------
1563        fn insert_into_map(
1564            ty: ItemType,
1565            path: &[Symbol],
1566            exact_path: Option<&[Symbol]>,
1567            search_unbox: bool,
1568            serialized_index: &mut SerializedSearchIndex,
1569            used_in_function_signature: &mut BTreeSet<isize>,
1570        ) -> RenderTypeId {
1571            let pathid = serialized_index.names.len();
1572            let pathid = match serialized_index.crate_paths_index.entry((ty, path.to_vec())) {
1573                Entry::Occupied(entry) => {
1574                    let id = *entry.get();
1575                    if serialized_index.type_data[id].as_mut().is_none() {
1576                        serialized_index.type_data[id] = Some(TypeData {
1577                            search_unbox,
1578                            inverted_function_inputs_index: Vec::new(),
1579                            inverted_function_output_index: Vec::new(),
1580                        });
1581                    } else if search_unbox {
1582                        serialized_index.type_data[id].as_mut().unwrap().search_unbox = true;
1583                    }
1584                    id
1585                }
1586                Entry::Vacant(entry) => {
1587                    entry.insert(pathid);
1588                    let (name, path) = path.split_last().unwrap();
1589                    serialized_index.push_type(
1590                        name.to_string(),
1591                        PathData {
1592                            ty,
1593                            module_path: path.to_vec(),
1594                            exact_module_path: if let Some(exact_path) = exact_path
1595                                && let Some((name2, exact_path)) = exact_path.split_last()
1596                                && name == name2
1597                            {
1598                                Some(exact_path.to_vec())
1599                            } else {
1600                                None
1601                            },
1602                        },
1603                        TypeData {
1604                            inverted_function_inputs_index: Vec::new(),
1605                            inverted_function_output_index: Vec::new(),
1606                            search_unbox,
1607                        },
1608                    );
1609                    pathid
1610                }
1611            };
1612            used_in_function_signature.insert(isize::try_from(pathid).unwrap());
1613            RenderTypeId::Index(isize::try_from(pathid).unwrap())
1614        }
1615
1616        fn convert_render_type_id(
1617            id: RenderTypeId,
1618            cache: &mut Cache,
1619            serialized_index: &mut SerializedSearchIndex,
1620            used_in_function_signature: &mut BTreeSet<isize>,
1621            tcx: TyCtxt<'_>,
1622        ) -> Option<RenderTypeId> {
1623            use crate::clean::PrimitiveType;
1624            let Cache { ref paths, ref external_paths, ref exact_paths, .. } = *cache;
1625            let search_unbox = match id {
1626                RenderTypeId::Mut => false,
1627                RenderTypeId::DefId(defid) => {
1628                    utils::has_doc_flag(tcx, defid, |d| d.search_unbox.is_some())
1629                }
1630                RenderTypeId::Primitive(
1631                    PrimitiveType::Reference | PrimitiveType::RawPointer | PrimitiveType::Tuple,
1632                ) => true,
1633                RenderTypeId::Primitive(..) => false,
1634                RenderTypeId::AssociatedType(..) => false,
1635                // this bool is only used by `insert_into_map`, so it doesn't matter what we set here
1636                // because Index means we've already inserted into the map
1637                RenderTypeId::Index(_) => false,
1638            };
1639            match id {
1640                RenderTypeId::Mut => Some(insert_into_map(
1641                    ItemType::Keyword,
1642                    &[kw::Mut],
1643                    None,
1644                    search_unbox,
1645                    serialized_index,
1646                    used_in_function_signature,
1647                )),
1648                RenderTypeId::DefId(defid) => {
1649                    if let Some(&(ref fqp, item_type)) =
1650                        paths.get(&defid).or_else(|| external_paths.get(&defid))
1651                    {
1652                        if tcx.lang_items().fn_mut_trait() == Some(defid)
1653                            || tcx.lang_items().fn_once_trait() == Some(defid)
1654                            || tcx.lang_items().fn_trait() == Some(defid)
1655                        {
1656                            let name = *fqp.last().unwrap();
1657                            // Make absolutely sure we use this single, correct path,
1658                            // because search.js needs to match. If we don't do this,
1659                            // there are three different paths that these traits may
1660                            // appear to come from.
1661                            Some(insert_into_map(
1662                                item_type,
1663                                &[sym::core, sym::ops, name],
1664                                Some(&[sym::core, sym::ops, name]),
1665                                search_unbox,
1666                                serialized_index,
1667                                used_in_function_signature,
1668                            ))
1669                        } else {
1670                            let exact_fqp = exact_paths
1671                                .get(&defid)
1672                                .or_else(|| external_paths.get(&defid).map(|(fqp, _)| fqp))
1673                                .map(|v| &v[..])
1674                                // Re-exports only count if the name is exactly the same.
1675                                // This is a size optimization, since it means we only need
1676                                // to store the name once (and the path is re-used for everything
1677                                // exported from this same module). It's also likely to Do
1678                                // What I Mean, since if a re-export changes the name, it might
1679                                // also be a change in semantic meaning.
1680                                .filter(|this_fqp| this_fqp.last() == fqp.last());
1681                            Some(insert_into_map(
1682                                item_type,
1683                                fqp,
1684                                exact_fqp,
1685                                search_unbox,
1686                                serialized_index,
1687                                used_in_function_signature,
1688                            ))
1689                        }
1690                    } else {
1691                        None
1692                    }
1693                }
1694                RenderTypeId::Primitive(primitive) => {
1695                    let sym = primitive.as_sym();
1696                    Some(insert_into_map(
1697                        ItemType::Primitive,
1698                        &[sym],
1699                        None,
1700                        search_unbox,
1701                        serialized_index,
1702                        used_in_function_signature,
1703                    ))
1704                }
1705                RenderTypeId::Index(index) => {
1706                    used_in_function_signature.insert(index);
1707                    Some(id)
1708                }
1709                RenderTypeId::AssociatedType(sym) => Some(insert_into_map(
1710                    ItemType::AssocType,
1711                    &[sym],
1712                    None,
1713                    search_unbox,
1714                    serialized_index,
1715                    used_in_function_signature,
1716                )),
1717            }
1718        }
1719
1720        fn convert_render_type(
1721            ty: &mut RenderType,
1722            cache: &mut Cache,
1723            serialized_index: &mut SerializedSearchIndex,
1724            used_in_function_signature: &mut BTreeSet<isize>,
1725            tcx: TyCtxt<'_>,
1726        ) {
1727            if let Some(generics) = &mut ty.generics {
1728                for item in generics {
1729                    convert_render_type(
1730                        item,
1731                        cache,
1732                        serialized_index,
1733                        used_in_function_signature,
1734                        tcx,
1735                    );
1736                }
1737            }
1738            if let Some(bindings) = &mut ty.bindings {
1739                bindings.retain_mut(|(associated_type, constraints)| {
1740                    let converted_associated_type = convert_render_type_id(
1741                        *associated_type,
1742                        cache,
1743                        serialized_index,
1744                        used_in_function_signature,
1745                        tcx,
1746                    );
1747                    let Some(converted_associated_type) = converted_associated_type else {
1748                        return false;
1749                    };
1750                    *associated_type = converted_associated_type;
1751                    for constraint in constraints {
1752                        convert_render_type(
1753                            constraint,
1754                            cache,
1755                            serialized_index,
1756                            used_in_function_signature,
1757                            tcx,
1758                        );
1759                    }
1760                    true
1761                });
1762            }
1763            let Some(id) = ty.id else {
1764                assert!(ty.generics.is_some());
1765                return;
1766            };
1767            ty.id = convert_render_type_id(
1768                id,
1769                cache,
1770                serialized_index,
1771                used_in_function_signature,
1772                tcx,
1773            );
1774            use crate::clean::PrimitiveType;
1775            // These cases are added to the inverted index, but not actually included
1776            // in the signature. There's a matching set of cases in the
1777            // `unifyFunctionTypeIsMatchCandidate` function, for the slow path.
1778            match id {
1779                // typeNameIdOfArrayOrSlice
1780                RenderTypeId::Primitive(PrimitiveType::Array | PrimitiveType::Slice) => {
1781                    insert_into_map(
1782                        ItemType::Primitive,
1783                        &[Symbol::intern("[]")],
1784                        None,
1785                        false,
1786                        serialized_index,
1787                        used_in_function_signature,
1788                    );
1789                }
1790                RenderTypeId::Primitive(PrimitiveType::Tuple | PrimitiveType::Unit) => {
1791                    // typeNameIdOfArrayOrSlice
1792                    insert_into_map(
1793                        ItemType::Primitive,
1794                        &[Symbol::intern("()")],
1795                        None,
1796                        false,
1797                        serialized_index,
1798                        used_in_function_signature,
1799                    );
1800                }
1801                // typeNameIdOfHof
1802                RenderTypeId::Primitive(PrimitiveType::Fn) => {
1803                    insert_into_map(
1804                        ItemType::Primitive,
1805                        &[Symbol::intern("->")],
1806                        None,
1807                        false,
1808                        serialized_index,
1809                        used_in_function_signature,
1810                    );
1811                }
1812                RenderTypeId::DefId(did)
1813                    if tcx.lang_items().fn_mut_trait() == Some(did)
1814                        || tcx.lang_items().fn_once_trait() == Some(did)
1815                        || tcx.lang_items().fn_trait() == Some(did) =>
1816                {
1817                    insert_into_map(
1818                        ItemType::Primitive,
1819                        &[Symbol::intern("->")],
1820                        None,
1821                        false,
1822                        serialized_index,
1823                        used_in_function_signature,
1824                    );
1825                }
1826                // not special
1827                _ => {}
1828            }
1829        }
1830        if let Some(search_type) = &mut item.info.search_type {
1831            let mut used_in_function_inputs = BTreeSet::new();
1832            let mut used_in_function_output = BTreeSet::new();
1833            for item in &mut search_type.inputs {
1834                convert_render_type(
1835                    item,
1836                    cache,
1837                    &mut serialized_index,
1838                    &mut used_in_function_inputs,
1839                    tcx,
1840                );
1841            }
1842            for item in &mut search_type.output {
1843                convert_render_type(
1844                    item,
1845                    cache,
1846                    &mut serialized_index,
1847                    &mut used_in_function_output,
1848                    tcx,
1849                );
1850            }
1851            let used_in_constraints = search_type
1852                .where_clause
1853                .iter_mut()
1854                .map(|constraint| {
1855                    let mut used_in_constraint = BTreeSet::new();
1856                    for trait_ in constraint {
1857                        convert_render_type(
1858                            trait_,
1859                            cache,
1860                            &mut serialized_index,
1861                            &mut used_in_constraint,
1862                            tcx,
1863                        );
1864                    }
1865                    used_in_constraint
1866                })
1867                .collect::<Vec<_>>();
1868            loop {
1869                let mut inserted_any = false;
1870                for (i, used_in_constraint) in used_in_constraints.iter().enumerate() {
1871                    let id = !(i as isize);
1872                    if used_in_function_inputs.contains(&id)
1873                        && !used_in_function_inputs.is_superset(&used_in_constraint)
1874                    {
1875                        used_in_function_inputs.extend(used_in_constraint.iter().copied());
1876                        inserted_any = true;
1877                    }
1878                    if used_in_function_output.contains(&id)
1879                        && !used_in_function_output.is_superset(&used_in_constraint)
1880                    {
1881                        used_in_function_output.extend(used_in_constraint.iter().copied());
1882                        inserted_any = true;
1883                    }
1884                }
1885                if !inserted_any {
1886                    break;
1887                }
1888            }
1889            let search_type_size = search_type.size() +
1890                // Artificially give struct fields a size of 8 instead of their real
1891                // size of 2. This is because search.js sorts them to the end, so
1892                // by pushing them down, we prevent them from blocking real 2-arity functions.
1893                //
1894                // The number 8 is arbitrary. We want it big, but not enormous,
1895                // because the postings list has to fill in an empty array for each
1896                // unoccupied size.
1897                if item.info.ty.is_fn_like() { 0 } else { 16 };
1898            serialized_index.function_data[new_entry_id] = Some(search_type.clone());
1899
1900            #[derive(Clone, Copy)]
1901            enum InvertedIndexType {
1902                Inputs,
1903                Output,
1904            }
1905            impl InvertedIndexType {
1906                fn from_type_data(self, type_data: &mut TypeData) -> &mut Vec<Vec<u32>> {
1907                    match self {
1908                        Self::Inputs => &mut type_data.inverted_function_inputs_index,
1909                        Self::Output => &mut type_data.inverted_function_output_index,
1910                    }
1911                }
1912            }
1913
1914            let mut process_used_in_function =
1915                |used_in_function: BTreeSet<isize>, index_type: InvertedIndexType| {
1916                    for index in used_in_function {
1917                        let postings = if index >= 0 {
1918                            assert!(serialized_index.path_data[index as usize].is_some());
1919                            index_type.from_type_data(
1920                                serialized_index.type_data[index as usize].as_mut().unwrap(),
1921                            )
1922                        } else {
1923                            let generic_id = index.unsigned_abs() - 1;
1924                            if generic_id >= serialized_index.generic_inverted_index.len() {
1925                                serialized_index
1926                                    .generic_inverted_index
1927                                    .resize(generic_id + 1, Vec::new());
1928                            }
1929                            &mut serialized_index.generic_inverted_index[generic_id]
1930                        };
1931                        if search_type_size >= postings.len() {
1932                            postings.resize(search_type_size + 1, Vec::new());
1933                        }
1934                        let posting = &mut postings[search_type_size];
1935                        if posting.last() != Some(&(new_entry_id as u32)) {
1936                            posting.push(new_entry_id as u32);
1937                        }
1938                    }
1939                };
1940
1941            process_used_in_function(used_in_function_inputs, InvertedIndexType::Inputs);
1942            process_used_in_function(used_in_function_output, InvertedIndexType::Output);
1943        }
1944    }
1945
1946    Ok(serialized_index.sort())
1947}
1948
1949pub(crate) fn get_function_type_for_search(
1950    item: &clean::Item,
1951    tcx: TyCtxt<'_>,
1952    impl_generics: Option<&(clean::Type, clean::Generics)>,
1953    parent: Option<DefId>,
1954    cache: &Cache,
1955) -> Option<IndexItemFunctionType> {
1956    let mut trait_info = None;
1957    let impl_or_trait_generics = impl_generics.or_else(|| {
1958        if let Some(def_id) = parent
1959            && let Some(trait_) = cache.traits.get(&def_id)
1960            && let Some((path, _)) =
1961                cache.paths.get(&def_id).or_else(|| cache.external_paths.get(&def_id))
1962        {
1963            let path = clean::Path {
1964                res: rustc_hir::def::Res::Def(rustc_hir::def::DefKind::Trait, def_id),
1965                segments: path
1966                    .iter()
1967                    .map(|name| clean::PathSegment {
1968                        name: *name,
1969                        args: clean::GenericArgs::AngleBracketed {
1970                            args: ThinVec::new(),
1971                            constraints: ThinVec::new(),
1972                        },
1973                    })
1974                    .collect(),
1975            };
1976            trait_info = Some((clean::Type::Path { path }, trait_.generics.clone()));
1977            Some(trait_info.as_ref().unwrap())
1978        } else {
1979            None
1980        }
1981    });
1982    let (mut inputs, mut output, param_names, where_clause) = match item.kind {
1983        clean::ForeignFunctionItem(ref f, _)
1984        | clean::FunctionItem(ref f)
1985        | clean::MethodItem(ref f, _)
1986        | clean::RequiredMethodItem(ref f, _) => {
1987            get_fn_inputs_and_outputs(f, tcx, impl_or_trait_generics, cache)
1988        }
1989        clean::ConstantItem(ref c) => make_nullary_fn(&c.type_),
1990        clean::StaticItem(ref s) => make_nullary_fn(&s.type_),
1991        clean::StructFieldItem(ref t) if let Some(parent) = parent => {
1992            let mut rgen: FxIndexMap<SimplifiedParam, (isize, Vec<RenderType>)> =
1993                Default::default();
1994            let output = get_index_type(t, vec![], &mut rgen);
1995            let input = RenderType {
1996                id: Some(RenderTypeId::DefId(parent)),
1997                generics: None,
1998                bindings: None,
1999            };
2000            (vec![input], vec![output], vec![], vec![])
2001        }
2002        _ => return None,
2003    };
2004
2005    inputs.retain(|a| a.id.is_some() || a.generics.is_some());
2006    output.retain(|a| a.id.is_some() || a.generics.is_some());
2007
2008    Some(IndexItemFunctionType { inputs, output, where_clause, param_names })
2009}
2010
2011fn get_index_type(
2012    clean_type: &clean::Type,
2013    generics: Vec<RenderType>,
2014    rgen: &mut FxIndexMap<SimplifiedParam, (isize, Vec<RenderType>)>,
2015) -> RenderType {
2016    RenderType {
2017        id: get_index_type_id(clean_type, rgen),
2018        generics: if generics.is_empty() { None } else { Some(generics) },
2019        bindings: None,
2020    }
2021}
2022
2023fn get_index_type_id(
2024    clean_type: &clean::Type,
2025    rgen: &mut FxIndexMap<SimplifiedParam, (isize, Vec<RenderType>)>,
2026) -> Option<RenderTypeId> {
2027    use rustc_hir::def::{DefKind, Res};
2028    match *clean_type {
2029        clean::Type::Path { ref path, .. } => Some(RenderTypeId::DefId(path.def_id())),
2030        clean::DynTrait(ref bounds, _) => {
2031            bounds.first().map(|b| RenderTypeId::DefId(b.trait_.def_id()))
2032        }
2033        clean::Primitive(p) => Some(RenderTypeId::Primitive(p)),
2034        clean::BorrowedRef { .. } => Some(RenderTypeId::Primitive(clean::PrimitiveType::Reference)),
2035        clean::RawPointer { .. } => Some(RenderTypeId::Primitive(clean::PrimitiveType::RawPointer)),
2036        // The type parameters are converted to generics in `simplify_fn_type`
2037        clean::Slice(_) => Some(RenderTypeId::Primitive(clean::PrimitiveType::Slice)),
2038        clean::Array(_, _) => Some(RenderTypeId::Primitive(clean::PrimitiveType::Array)),
2039        clean::BareFunction(_) => Some(RenderTypeId::Primitive(clean::PrimitiveType::Fn)),
2040        clean::Tuple(ref n) if n.is_empty() => {
2041            Some(RenderTypeId::Primitive(clean::PrimitiveType::Unit))
2042        }
2043        clean::Tuple(_) => Some(RenderTypeId::Primitive(clean::PrimitiveType::Tuple)),
2044        clean::QPath(ref data) => {
2045            if data.self_type.is_self_type()
2046                && let Some(clean::Path { res: Res::Def(DefKind::Trait, trait_), .. }) = data.trait_
2047            {
2048                let idx = -isize::try_from(rgen.len() + 1).unwrap();
2049                let (idx, _) = rgen
2050                    .entry(SimplifiedParam::AssociatedType(trait_, data.assoc.name))
2051                    .or_insert_with(|| (idx, Vec::new()));
2052                Some(RenderTypeId::Index(*idx))
2053            } else {
2054                None
2055            }
2056        }
2057        // Not supported yet
2058        clean::Type::Pat(..)
2059        | clean::Type::FieldOf(..)
2060        | clean::Generic(_)
2061        | clean::SelfTy
2062        | clean::ImplTrait(_)
2063        | clean::Infer
2064        | clean::UnsafeBinder(_) => None,
2065    }
2066}
2067
2068#[derive(Clone, Copy, Eq, Hash, PartialEq)]
2069enum SimplifiedParam {
2070    // other kinds of type parameters are identified by their name
2071    Symbol(Symbol),
2072    // every argument-position impl trait is its own type parameter
2073    Anonymous(isize),
2074    // in a trait definition, the associated types are all bound to
2075    // their own type parameter
2076    AssociatedType(DefId, Symbol),
2077}
2078
2079/// The point of this function is to lower generics and types into the simplified form that the
2080/// frontend search engine can use.
2081///
2082/// For example, `[T, U, i32]]` where you have the bounds: `T: Display, U: Option<T>` will return
2083/// `[-1, -2, i32] where -1: Display, -2: Option<-1>`. If a type parameter has no trait bound, it
2084/// will still get a number. If a constraint is present but not used in the actual types, it will
2085/// not be added to the map.
2086///
2087/// This function also works recursively.
2088#[instrument(level = "trace", skip(tcx, rgen, cache))]
2089fn simplify_fn_type<'a, 'tcx>(
2090    self_: Option<&'a Type>,
2091    generics: &Generics,
2092    arg: &'a Type,
2093    tcx: TyCtxt<'tcx>,
2094    recurse: usize,
2095    rgen: &mut FxIndexMap<SimplifiedParam, (isize, Vec<RenderType>)>,
2096    is_return: bool,
2097    cache: &Cache,
2098) -> Option<RenderType> {
2099    if recurse >= 10 {
2100        // FIXME: remove this whole recurse thing when the recursion bug is fixed
2101        // See #59502 for the original issue.
2102        return None;
2103    }
2104
2105    // First, check if it's "Self".
2106    let (is_self, arg) = if let Some(self_) = self_
2107        && arg.is_self_type()
2108    {
2109        (true, self_)
2110    } else {
2111        (false, arg)
2112    };
2113
2114    // If this argument is a type parameter and not a trait bound or a type, we need to look
2115    // for its bounds.
2116    match *arg {
2117        Type::Generic(arg_s) => {
2118            // First we check if the bounds are in a `where` predicate...
2119            let where_bounds = generics
2120                .where_predicates
2121                .iter()
2122                .filter_map(|g| {
2123                    if let WherePredicate::BoundPredicate { ty, bounds, .. } = g
2124                        && *ty == *arg
2125                    {
2126                        Some(bounds)
2127                    } else {
2128                        None
2129                    }
2130                })
2131                .flatten();
2132            // Otherwise we check if the trait bounds are "inlined" like `T: Option<u32>`...
2133            let inline_bounds = generics
2134                .params
2135                .iter()
2136                .find(|g| g.is_type() && g.name == arg_s)
2137                .and_then(|bound| bound.get_bounds())
2138                .into_iter()
2139                .flatten();
2140
2141            let type_bounds = where_bounds
2142                .chain(inline_bounds)
2143                .filter_map(
2144                    |bound| if let Some(path) = bound.get_trait_path() { Some(path) } else { None },
2145                )
2146                .filter_map(|path| {
2147                    let ty = Type::Path { path };
2148                    simplify_fn_type(self_, generics, &ty, tcx, recurse + 1, rgen, is_return, cache)
2149                })
2150                .collect();
2151
2152            Some(if let Some((idx, _)) = rgen.get(&SimplifiedParam::Symbol(arg_s)) {
2153                RenderType { id: Some(RenderTypeId::Index(*idx)), generics: None, bindings: None }
2154            } else {
2155                let idx = -isize::try_from(rgen.len() + 1).unwrap();
2156                rgen.insert(SimplifiedParam::Symbol(arg_s), (idx, type_bounds));
2157                RenderType { id: Some(RenderTypeId::Index(idx)), generics: None, bindings: None }
2158            })
2159        }
2160        Type::ImplTrait(ref bounds) => {
2161            let type_bounds = bounds
2162                .iter()
2163                .filter_map(|bound| bound.get_trait_path())
2164                .filter_map(|path| {
2165                    let ty = Type::Path { path };
2166                    simplify_fn_type(self_, generics, &ty, tcx, recurse + 1, rgen, is_return, cache)
2167                })
2168                .collect::<Vec<_>>();
2169            Some(if is_return && !type_bounds.is_empty() {
2170                // In return position, `impl Trait` is a unique thing.
2171                RenderType { id: None, generics: Some(type_bounds), bindings: None }
2172            } else {
2173                // In parameter position, `impl Trait` is the same as an unnamed generic parameter.
2174                let idx = -isize::try_from(rgen.len() + 1).unwrap();
2175                rgen.insert(SimplifiedParam::Anonymous(idx), (idx, type_bounds));
2176                RenderType { id: Some(RenderTypeId::Index(idx)), generics: None, bindings: None }
2177            })
2178        }
2179        Type::Slice(ref ty) => {
2180            let ty_generics =
2181                simplify_fn_type(self_, generics, ty, tcx, recurse + 1, rgen, is_return, cache)
2182                    .into_iter()
2183                    .collect();
2184            Some(get_index_type(arg, ty_generics, rgen))
2185        }
2186        Type::Array(ref ty, _) => {
2187            let ty_generics =
2188                simplify_fn_type(self_, generics, ty, tcx, recurse + 1, rgen, is_return, cache)
2189                    .into_iter()
2190                    .collect();
2191            Some(get_index_type(arg, ty_generics, rgen))
2192        }
2193        Type::Tuple(ref tys) => {
2194            let ty_generics = tys
2195                .iter()
2196                .filter_map(|ty| {
2197                    simplify_fn_type(self_, generics, ty, tcx, recurse + 1, rgen, is_return, cache)
2198                })
2199                .collect();
2200            Some(get_index_type(arg, ty_generics, rgen))
2201        }
2202        Type::BareFunction(ref bf) => {
2203            let ty_generics = bf
2204                .decl
2205                .inputs
2206                .iter()
2207                .map(|arg| &arg.type_)
2208                .filter_map(|ty| {
2209                    simplify_fn_type(self_, generics, ty, tcx, recurse + 1, rgen, is_return, cache)
2210                })
2211                .collect();
2212            // The search index, for simplicity's sake, represents fn pointers and closures
2213            // the same way: as a tuple for the parameters, and an associated type for the
2214            // return type.
2215            let ty_output = simplify_fn_type(
2216                self_,
2217                generics,
2218                &bf.decl.output,
2219                tcx,
2220                recurse + 1,
2221                rgen,
2222                is_return,
2223                cache,
2224            )
2225            .into_iter()
2226            .collect();
2227            let ty_bindings = vec![(RenderTypeId::AssociatedType(sym::Output), ty_output)];
2228            Some(RenderType {
2229                id: get_index_type_id(arg, rgen),
2230                bindings: Some(ty_bindings),
2231                generics: Some(ty_generics),
2232            })
2233        }
2234        Type::BorrowedRef { lifetime: _, mutability, ref type_ }
2235        | Type::RawPointer(mutability, ref type_) => {
2236            let mut ty_generics = Vec::new();
2237            if mutability.is_mut() {
2238                ty_generics.push(RenderType {
2239                    id: Some(RenderTypeId::Mut),
2240                    generics: None,
2241                    bindings: None,
2242                });
2243            }
2244            if let Some(ty) =
2245                simplify_fn_type(self_, generics, type_, tcx, recurse + 1, rgen, is_return, cache)
2246            {
2247                ty_generics.push(ty);
2248            }
2249            Some(get_index_type(arg, ty_generics, rgen))
2250        }
2251        _ => {
2252            // This is not a type parameter. So for example if we have `T, U: Option<T>`, and we're
2253            // looking at `Option`, we enter this "else" condition, otherwise if it's `T`, we don't.
2254            //
2255            // So in here, we can add it directly and look for its own type parameters (so for `Option`,
2256            // we will look for them but not for `T`).
2257            let mut ty_generics = Vec::new();
2258            let mut ty_constraints = Vec::new();
2259            if let Some(arg_generics) = arg.generic_args() {
2260                ty_generics = arg_generics
2261                    .into_iter()
2262                    .filter_map(|param| match param {
2263                        clean::GenericArg::Type(ty) => Some(ty),
2264                        _ => None,
2265                    })
2266                    .filter_map(|ty| {
2267                        simplify_fn_type(
2268                            self_,
2269                            generics,
2270                            &ty,
2271                            tcx,
2272                            recurse + 1,
2273                            rgen,
2274                            is_return,
2275                            cache,
2276                        )
2277                    })
2278                    .collect();
2279                for constraint in arg_generics.constraints() {
2280                    simplify_fn_constraint(
2281                        self_,
2282                        generics,
2283                        &constraint,
2284                        tcx,
2285                        recurse + 1,
2286                        &mut ty_constraints,
2287                        rgen,
2288                        is_return,
2289                        cache,
2290                    );
2291                }
2292            }
2293            // Every trait associated type on self gets assigned to a type parameter index
2294            // this same one is used later for any appearances of these types
2295            //
2296            // for example, Iterator::next is:
2297            //
2298            //     trait Iterator {
2299            //         fn next(&mut self) -> Option<Self::Item>
2300            //     }
2301            //
2302            // Self is technically just Iterator, but we want to pretend it's more like this:
2303            //
2304            //     fn next<T>(self: Iterator<Item=T>) -> Option<T>
2305            if is_self
2306                && let Type::Path { path } = arg
2307                && let def_id = path.def_id()
2308                && let Some(trait_) = cache.traits.get(&def_id)
2309                && trait_.items.iter().any(|at| at.is_required_associated_type())
2310            {
2311                for assoc_ty in &trait_.items {
2312                    if let clean::ItemKind::RequiredAssocTypeItem(_generics, bounds) =
2313                        &assoc_ty.kind
2314                        && let Some(name) = assoc_ty.name
2315                    {
2316                        let idx = -isize::try_from(rgen.len() + 1).unwrap();
2317                        let (idx, stored_bounds) = rgen
2318                            .entry(SimplifiedParam::AssociatedType(def_id, name))
2319                            .or_insert_with(|| (idx, Vec::new()));
2320                        let idx = *idx;
2321                        if stored_bounds.is_empty() {
2322                            // Can't just pass stored_bounds to simplify_fn_type,
2323                            // because it also accepts rgen as a parameter.
2324                            // Instead, have it fill in this local, then copy it into the map afterward.
2325                            let type_bounds = bounds
2326                                .iter()
2327                                .filter_map(|bound| bound.get_trait_path())
2328                                .filter_map(|path| {
2329                                    let ty = Type::Path { path };
2330                                    simplify_fn_type(
2331                                        self_,
2332                                        generics,
2333                                        &ty,
2334                                        tcx,
2335                                        recurse + 1,
2336                                        rgen,
2337                                        is_return,
2338                                        cache,
2339                                    )
2340                                })
2341                                .collect();
2342                            let stored_bounds = &mut rgen
2343                                .get_mut(&SimplifiedParam::AssociatedType(def_id, name))
2344                                .unwrap()
2345                                .1;
2346                            if stored_bounds.is_empty() {
2347                                *stored_bounds = type_bounds;
2348                            }
2349                        }
2350                        ty_constraints.push((
2351                            RenderTypeId::AssociatedType(name),
2352                            vec![RenderType {
2353                                id: Some(RenderTypeId::Index(idx)),
2354                                generics: None,
2355                                bindings: None,
2356                            }],
2357                        ))
2358                    }
2359                }
2360            }
2361            let id = get_index_type_id(arg, rgen);
2362            if id.is_some() || !ty_generics.is_empty() {
2363                Some(RenderType {
2364                    id,
2365                    bindings: if ty_constraints.is_empty() { None } else { Some(ty_constraints) },
2366                    generics: if ty_generics.is_empty() { None } else { Some(ty_generics) },
2367                })
2368            } else {
2369                None
2370            }
2371        }
2372    }
2373}
2374
2375fn simplify_fn_constraint<'a>(
2376    self_: Option<&'a Type>,
2377    generics: &Generics,
2378    constraint: &'a clean::AssocItemConstraint,
2379    tcx: TyCtxt<'_>,
2380    recurse: usize,
2381    res: &mut Vec<(RenderTypeId, Vec<RenderType>)>,
2382    rgen: &mut FxIndexMap<SimplifiedParam, (isize, Vec<RenderType>)>,
2383    is_return: bool,
2384    cache: &Cache,
2385) {
2386    let mut ty_constraints = Vec::new();
2387    let ty_constrained_assoc = RenderTypeId::AssociatedType(constraint.assoc.name);
2388    for param in &constraint.assoc.args {
2389        match param {
2390            clean::GenericArg::Type(arg) => {
2391                ty_constraints.extend(simplify_fn_type(
2392                    self_,
2393                    generics,
2394                    &arg,
2395                    tcx,
2396                    recurse + 1,
2397                    rgen,
2398                    is_return,
2399                    cache,
2400                ));
2401            }
2402            clean::GenericArg::Lifetime(_)
2403            | clean::GenericArg::Const(_)
2404            | clean::GenericArg::Infer => {}
2405        }
2406    }
2407    for constraint in constraint.assoc.args.constraints() {
2408        simplify_fn_constraint(
2409            self_,
2410            generics,
2411            &constraint,
2412            tcx,
2413            recurse + 1,
2414            res,
2415            rgen,
2416            is_return,
2417            cache,
2418        );
2419    }
2420    match &constraint.kind {
2421        clean::AssocItemConstraintKind::Equality { term } => {
2422            if let clean::Term::Type(arg) = &term {
2423                ty_constraints.extend(simplify_fn_type(
2424                    self_,
2425                    generics,
2426                    arg,
2427                    tcx,
2428                    recurse + 1,
2429                    rgen,
2430                    is_return,
2431                    cache,
2432                ));
2433            }
2434        }
2435        clean::AssocItemConstraintKind::Bound { bounds } => {
2436            for bound in &bounds[..] {
2437                if let Some(path) = bound.get_trait_path() {
2438                    let ty = Type::Path { path };
2439                    ty_constraints.extend(simplify_fn_type(
2440                        self_,
2441                        generics,
2442                        &ty,
2443                        tcx,
2444                        recurse + 1,
2445                        rgen,
2446                        is_return,
2447                        cache,
2448                    ));
2449                }
2450            }
2451        }
2452    }
2453    res.push((ty_constrained_assoc, ty_constraints));
2454}
2455
2456/// Create a fake nullary function.
2457///
2458/// Used to allow type-based search on constants and statics.
2459fn make_nullary_fn(
2460    clean_type: &clean::Type,
2461) -> (Vec<RenderType>, Vec<RenderType>, Vec<Option<Symbol>>, Vec<Vec<RenderType>>) {
2462    let mut rgen: FxIndexMap<SimplifiedParam, (isize, Vec<RenderType>)> = Default::default();
2463    let output = get_index_type(clean_type, vec![], &mut rgen);
2464    (vec![], vec![output], vec![], vec![])
2465}
2466
2467/// Return the full list of types when bounds have been resolved.
2468///
2469/// i.e. `fn foo<A: Display, B: Option<A>>(x: u32, y: B)` will return
2470/// `[u32, Display, Option]`.
2471fn get_fn_inputs_and_outputs(
2472    func: &Function,
2473    tcx: TyCtxt<'_>,
2474    impl_or_trait_generics: Option<&(clean::Type, clean::Generics)>,
2475    cache: &Cache,
2476) -> (Vec<RenderType>, Vec<RenderType>, Vec<Option<Symbol>>, Vec<Vec<RenderType>>) {
2477    let decl = &func.decl;
2478
2479    let mut rgen: FxIndexMap<SimplifiedParam, (isize, Vec<RenderType>)> = Default::default();
2480
2481    let combined_generics;
2482    let (self_, generics) = if let Some((impl_self, impl_generics)) = impl_or_trait_generics {
2483        match (impl_generics.is_empty(), func.generics.is_empty()) {
2484            (true, _) => (Some(impl_self), &func.generics),
2485            (_, true) => (Some(impl_self), impl_generics),
2486            (false, false) => {
2487                let params =
2488                    func.generics.params.iter().chain(&impl_generics.params).cloned().collect();
2489                let where_predicates = func
2490                    .generics
2491                    .where_predicates
2492                    .iter()
2493                    .chain(&impl_generics.where_predicates)
2494                    .cloned()
2495                    .collect();
2496                combined_generics = clean::Generics { params, where_predicates };
2497                (Some(impl_self), &combined_generics)
2498            }
2499        }
2500    } else {
2501        (None, &func.generics)
2502    };
2503
2504    let param_types = decl
2505        .inputs
2506        .iter()
2507        .filter_map(|param| {
2508            simplify_fn_type(self_, generics, &param.type_, tcx, 0, &mut rgen, false, cache)
2509        })
2510        .collect();
2511
2512    let ret_types = simplify_fn_type(self_, generics, &decl.output, tcx, 0, &mut rgen, true, cache)
2513        .into_iter()
2514        .collect();
2515
2516    let mut simplified_params = rgen.into_iter().collect::<Vec<_>>();
2517    simplified_params.sort_by_key(|(_, (idx, _))| -idx);
2518    (
2519        param_types,
2520        ret_types,
2521        simplified_params
2522            .iter()
2523            .map(|(name, (_idx, _traits))| match name {
2524                SimplifiedParam::Symbol(name) => Some(*name),
2525                SimplifiedParam::Anonymous(_) => None,
2526                SimplifiedParam::AssociatedType(def_id, name) => {
2527                    Some(Symbol::intern(&format!("{}::{}", tcx.item_name(*def_id), name)))
2528                }
2529            })
2530            .collect(),
2531        simplified_params.into_iter().map(|(_name, (_idx, traits))| traits).collect(),
2532    )
2533}