//! Proc macro which builds the Symbol table //! //! # Debugging //! //! Since this proc-macro does some non-trivial work, debugging it is important. //! This proc-macro can be invoked as an ordinary unit test, like so: //! //! ```bash //! cd compiler/rustc_macros //! cargo test symbols::test_symbols -- --nocapture //! ``` //! //! This unit test finds the `symbols!` invocation in `compiler/rustc_span/src/symbol.rs` //! and runs it. It verifies that the output token stream can be parsed as valid module //! items and that no errors were produced. //! //! You can also view the generated code by using `cargo expand`: //! //! ```bash //! cargo install cargo-expand # this is necessary only once //! cd compiler/rustc_span //! cargo expand > /tmp/rustc_span.rs # it's a big file //! ``` use proc_macro2::{Span, TokenStream}; use quote::quote; use std::collections::HashMap; use syn::parse::{Parse, ParseStream, Result}; use syn::{braced, punctuated::Punctuated, Ident, LitStr, Token}; #[cfg(test)] mod tests; mod kw { syn::custom_keyword!(Keywords); syn::custom_keyword!(Symbols); } struct Keyword { name: Ident, value: LitStr, } impl Parse for Keyword { fn parse(input: ParseStream<'_>) -> Result { let name = input.parse()?; input.parse::()?; let value = input.parse()?; Ok(Keyword { name, value }) } } struct Symbol { name: Ident, value: Value, } enum Value { SameAsName, String(LitStr), } impl Parse for Symbol { fn parse(input: ParseStream<'_>) -> Result { let name = input.parse()?; let colon_token: Option = input.parse()?; let value = if colon_token.is_some() { input.parse()? } else { Value::SameAsName }; Ok(Symbol { name, value }) } } impl Parse for Value { fn parse(input: ParseStream<'_>) -> Result { let lit: LitStr = input.parse()?; Ok(Value::String(lit)) } } struct Input { keywords: Punctuated, symbols: Punctuated, } impl Parse for Input { fn parse(input: ParseStream<'_>) -> Result { input.parse::()?; let content; braced!(content in input); let keywords = Punctuated::parse_terminated(&content)?; input.parse::()?; let content; braced!(content in input); let symbols = Punctuated::parse_terminated(&content)?; Ok(Input { keywords, symbols }) } } #[derive(Default)] struct Errors { list: Vec, } impl Errors { fn error(&mut self, span: Span, message: String) { self.list.push(syn::Error::new(span, message)); } } pub fn symbols(input: TokenStream) -> TokenStream { let (mut output, errors) = symbols_with_errors(input); // If we generated any errors, then report them as compiler_error!() macro calls. // This lets the errors point back to the most relevant span. It also allows us // to report as many errors as we can during a single run. output.extend(errors.into_iter().map(|e| e.to_compile_error())); output } struct Preinterned { idx: u32, span_of_name: Span, } fn symbols_with_errors(input: TokenStream) -> (TokenStream, Vec) { let mut errors = Errors::default(); let input: Input = match syn::parse2(input) { Ok(input) => input, Err(e) => { // This allows us to display errors at the proper span, while minimizing // unrelated errors caused by bailing out (and not generating code). errors.list.push(e); Input { keywords: Default::default(), symbols: Default::default() } } }; let mut keyword_stream = quote! {}; let mut symbols_stream = quote! {}; let mut prefill_stream = quote! {}; let mut entries = HashMap::::with_capacity( input.keywords.len() + input.symbols.len() + 10, ); let mut prev_key: Option<(Span, String)> = None; let mut insert = |span: Span, str: &str, errors: &mut Errors| -> u32 { if let Some(prev) = entries.get(str) { errors.error(span, format!("Symbol `{str}` is duplicated")); errors.error(prev.span_of_name, "location of previous definition".to_string()); prev.idx } else { let idx = u32::try_from(entries.len()).expect("way too many symbols"); entries.insert(str.to_string(), Preinterned { idx, span_of_name: span }); idx } }; let mut check_order = |span: Span, str: &str, errors: &mut Errors| { if let Some((prev_span, ref prev_str)) = prev_key { if str < prev_str { errors.error(span, format!("Symbol `{str}` must precede `{prev_str}`")); errors.error(prev_span, format!("location of previous symbol `{prev_str}`")); } } prev_key = Some((span, str.to_string())); }; // Generate the listed keywords. for keyword in input.keywords.iter() { let name = &keyword.name; let value = &keyword.value; let value_string = value.value(); let idx = insert(keyword.name.span(), &value_string, &mut errors); prefill_stream.extend(quote! { #value, }); keyword_stream.extend(quote! { pub const #name: Symbol = Symbol::new(#idx); }); } // Generate the listed symbols. for symbol in input.symbols.iter() { let name = &symbol.name; let value = match &symbol.value { Value::SameAsName => name.to_string(), Value::String(lit) => lit.value(), }; let idx = insert(symbol.name.span(), &value, &mut errors); check_order(symbol.name.span(), &name.to_string(), &mut errors); prefill_stream.extend(quote! { #value, }); symbols_stream.extend(quote! { pub const #name: Symbol = Symbol::new(#idx); }); } // Generate symbols for the strings "0", "1", ..., "9". for n in 0..10 { let n = n.to_string(); insert(Span::call_site(), &n, &mut errors); prefill_stream.extend(quote! { #n, }); } let symbol_digits_base = entries["0"].idx; let preinterned_symbols_count = u32::try_from(entries.len()).expect("way too many symbols"); let output = quote! { const SYMBOL_DIGITS_BASE: u32 = #symbol_digits_base; const PREINTERNED_SYMBOLS_COUNT: u32 = #preinterned_symbols_count; #[doc(hidden)] #[allow(non_upper_case_globals)] mod kw_generated { use super::Symbol; #keyword_stream } #[allow(non_upper_case_globals)] #[doc(hidden)] pub mod sym_generated { use super::Symbol; #symbols_stream } impl Interner { pub(crate) fn fresh() -> Self { Interner::prefill(&[ #prefill_stream ]) } } }; (output, errors.list) // To see the generated code, use the "cargo expand" command. // Do this once to install: // cargo install cargo-expand // // Then, cd to rustc_span and run: // cargo expand > /tmp/rustc_span_expanded.rs // // and read that file. }