aboutsummaryrefslogtreecommitdiff
path: root/tools/src/bin/gen.rs
blob: e772922baa330a54f933b37c6e951636811ef015 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
extern crate serde;
#[macro_use]
extern crate serde_derive;

extern crate file;
extern crate ron;

use std::path::PathBuf;
use std::fmt::Write;

/// Regenerates the syntax-kinds source file from the grammar description.
///
/// The freshly generated text is compared with the current contents of
/// `generated_file()`; if that file cannot be read, the default (empty) text
/// is used for the comparison. The file is rewritten only when the two differ,
/// so an up-to-date file is left untouched.
///
/// # Panics
///
/// Panics if the grammar cannot be loaded or the output cannot be written.
fn main() {
    let fresh = Grammar::read().to_syntax_kinds();
    let target = generated_file();
    let on_disk = file::get_text(&target).unwrap_or_default();
    if fresh == on_disk {
        // Nothing changed: skip the write entirely.
        return;
    }
    file::put_text(&target, &fresh).unwrap();
}

/// Description of the language's syntax kinds, deserialized from RON by
/// `Grammar::read`.
///
/// `to_syntax_kinds` emits one `SyntaxKind` variant per entry, in the order
/// tokens, keywords, contextual keywords, nodes; every name is upper-cased.
#[derive(Deserialize)]
struct Grammar {
    /// Keywords; each yields a `<NAME>_KW` kind and an arm in the generated
    /// `from_keyword` lookup.
    keywords: Vec<String>,
    /// Contextual keywords; each yields a `<NAME>_KW` kind but is deliberately
    /// left out of the generated `from_keyword` lookup.
    contextual_keywords: Vec<String>,
    /// Token kind names; emitted first.
    tokens: Vec<String>,
    /// Node kind names; emitted last.
    nodes: Vec<String>,
}

impl Grammar {
    fn read() -> Grammar {
        let text = file::get_text(&grammar_file()).unwrap();
        ron::de::from_str(&text).unwrap()
    }

    fn to_syntax_kinds(&self) -> String {
        let mut acc = String::new();
        acc.push_str("#![allow(bad_style, missing_docs, unreachable_pub)]\n");
        acc.push_str("#![cfg_attr(rustfmt, rustfmt_skip)]\n");
        acc.push_str("//! Generated from grammar.ron\n");
        acc.push_str("use super::SyntaxInfo;\n");
        acc.push_str("\n");

        let syntax_kinds: Vec<String> = self.tokens
            .iter()
            .cloned()
            .chain(self.keywords.iter().map(|kw| kw_token(kw)))
            .chain(self.contextual_keywords.iter().map(|kw| kw_token(kw)))
            .chain(self.nodes.iter().cloned())
            .collect();

        // enum SyntaxKind
        acc.push_str("/// The kind of syntax node, e.g. `IDENT`, `USE_KW`, or `STRUCT_DEF`.\n");
        acc.push_str("#[derive(Clone, Copy, PartialEq, Eq, PartialOrd, Ord, Hash)]\n");
        acc.push_str("pub enum SyntaxKind {\n");
        for kind in syntax_kinds.iter() {
            write!(acc, "    {},\n", scream(kind)).unwrap();
        }
        acc.push_str("\n");
        acc.push_str("    // Technical SyntaxKinds: they appear temporally during parsing,\n");
        acc.push_str("    // but never end up in the final tree\n");
        acc.push_str("    #[doc(hidden)]\n");
        acc.push_str("    TOMBSTONE,\n");
        acc.push_str("    #[doc(hidden)]\n");
        acc.push_str("    EOF,\n");
        acc.push_str("}\n");
        acc.push_str("pub(crate) use self::SyntaxKind::*;\n");
        acc.push_str("\n");

        // fn info
        acc.push_str("impl SyntaxKind {\n");
        acc.push_str("    pub(crate) fn info(self) -> &'static SyntaxInfo {\n");
        acc.push_str("        match self {\n");
        for kind in syntax_kinds.iter() {
            let sname = scream(kind);
            write!(
                acc,
                "            {sname} => &SyntaxInfo {{ name: \"{sname}\" }},\n",
                sname = sname
            ).unwrap();
        }
        acc.push_str("\n");
        acc.push_str("            TOMBSTONE => &SyntaxInfo { name: \"TOMBSTONE\" },\n");
        acc.push_str("            EOF => &SyntaxInfo { name: \"EOF\" },\n");
        acc.push_str("        }\n");
        acc.push_str("    }\n");

        // fn from_keyword
        acc.push_str("    pub(crate) fn from_keyword(ident: &str) -> Option<SyntaxKind> {\n");
        acc.push_str("        match ident {\n");
        // NB: no contextual_keywords here!
        for kw in self.keywords.iter() {
            write!(acc, "            {:?} => Some({}),\n", kw, kw_token(kw)).unwrap();
        }
        acc.push_str("            _ => None,\n");
        acc.push_str("        }\n");
        acc.push_str("    }\n");
        acc.push_str("}\n");
        acc.push_str("\n");
        acc
    }
}

/// Path of the grammar description: `grammar.ron` directly under `base_dir()`.
fn grammar_file() -> PathBuf {
    let mut path = base_dir();
    path.push("grammar.ron");
    path
}

/// Path of the generated Rust source: `src/syntax_kinds/generated.rs`
/// relative to `base_dir()`.
fn generated_file() -> PathBuf {
    let mut path = base_dir();
    path.push("src/syntax_kinds/generated.rs");
    path
}

/// Returns `word` with its ASCII letters upper-cased; all other characters
/// (including non-ASCII letters) are left as they are.
fn scream(word: &str) -> String {
    word.to_ascii_uppercase()
}

/// Builds the syntax-kind name for a keyword: the upper-cased keyword
/// followed by the `_KW` suffix (e.g. `use` becomes `USE_KW`).
fn kw_token(keyword: &str) -> String {
    let mut name = scream(keyword);
    name.push_str("_KW");
    name
}

/// Returns the parent of the directory that `CARGO_MANIFEST_DIR` named when
/// this binary was compiled.
///
/// # Panics
///
/// Panics if that directory has no parent.
fn base_dir() -> PathBuf {
    // `env!` is expanded at compile time, so the path is baked into the binary.
    let manifest_dir = PathBuf::from(env!("CARGO_MANIFEST_DIR"));
    let parent = manifest_dir.parent().unwrap();
    parent.to_path_buf()
}