aboutsummaryrefslogtreecommitdiff
path: root/src/bin/gen.rs
blob: 89609bd77e61fbd04bbeb9e2d6e78bd982128493 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
extern crate serde;
#[macro_use]
extern crate serde_derive;

extern crate file;
extern crate ron;

use std::path::PathBuf;
use std::fmt::Write;

/// Entry point of the generator: loads the grammar, renders the syntax-kinds
/// source text from it, and writes that text to the generated file.
///
/// # Panics
///
/// Panics if the grammar cannot be loaded or the output cannot be written.
fn main() {
    let rendered = Grammar::read().to_syntax_kinds();
    let output_path = generated_file();
    file::put_text(&output_path, &rendered).unwrap();
}

/// Grammar description deserialized from `grammar.ron`; the input to code
/// generation.
///
/// All three lists contribute variants to the generated `SyntaxKind` enum, in
/// the order keywords, tokens, nodes.
#[derive(Deserialize)]
struct Grammar {
    /// Keyword spellings; each becomes an upper-cased `<KEYWORD>_KW` kind and
    /// an arm of the generated `ident_to_keyword` lookup.
    keywords: Vec<String>,
    /// Kind names emitted (upper-cased) after the keyword kinds.
    tokens: Vec<String>,
    /// Kind names emitted (upper-cased) after the token kinds.
    nodes: Vec<String>,
}

impl Grammar {
    /// Loads the grammar from the file named by `grammar_file()` and
    /// deserializes it from RON.
    ///
    /// # Panics
    ///
    /// Panics if the file cannot be read or its contents do not deserialize
    /// into a `Grammar`.
    fn read() -> Grammar {
        let source = file::get_text(&grammar_file()).unwrap();
        ron::de::from_str(&source).unwrap()
    }

    /// Renders the Rust source text of the generated syntax-kinds module.
    ///
    /// The output consists of, in order: a fixed header, the `SyntaxKind`
    /// enum, the `SyntaxKind::info` method, and the `ident_to_keyword`
    /// function.
    fn to_syntax_kinds(&self) -> String {
        // Upper-cased names of every kind, in declaration order: keywords
        // (with the `_KW` suffix), then tokens, then nodes.
        let mut kind_names: Vec<String> = Vec::new();
        kind_names.extend(self.keywords.iter().map(|kw| scream(&kw_token(kw))));
        kind_names.extend(self.tokens.iter().map(|tok| scream(tok)));
        kind_names.extend(self.nodes.iter().map(|node| scream(node)));

        let mut out = String::new();

        // File header.
        out += "#![allow(bad_style, missing_docs, unreachable_pub)]\n";
        out += "#![cfg_attr(rustfmt, rustfmt_skip)]\n";
        out += "//! Generated from grammar.ron\n";
        out += "use tree::SyntaxInfo;\n";
        out += "\n";

        // `enum SyntaxKind`: one variant per grammar kind, followed by the two
        // fixed technical variants.
        out += "/// The kind of syntax node, e.g. `IDENT`, `USE_KW`, or `STRUCT_DEF`.\n";
        out += "#[derive(Clone, Copy, PartialEq, Eq, PartialOrd, Ord, Hash)]\n";
        out += "#[repr(u32)]\n";
        out += "pub enum SyntaxKind {\n";
        for name in &kind_names {
            write!(out, "    {},\n", name).unwrap();
        }
        out += "\n";
        out += "    // Technical SyntaxKinds: they appear temporally during parsing,\n";
        out += "    // but never end up in the final tree\n";
        out += "    #[doc(hidden)]\n";
        out += "    TOMBSTONE,\n";
        out += "    #[doc(hidden)]\n";
        out += "    EOF,\n";
        out += "}\n";
        out += "pub(crate) use self::SyntaxKind::*;\n";
        out += "\n";

        // `SyntaxKind::info`: maps each variant to a static `SyntaxInfo`
        // carrying the variant's own name.
        out += "impl SyntaxKind {\n";
        out += "    pub(crate) fn info(self) -> &'static SyntaxInfo {\n";
        out += "        match self {\n";
        for name in &kind_names {
            write!(
                out,
                "            {sname} => &SyntaxInfo {{ name: \"{sname}\" }},\n",
                sname = name
            ).unwrap();
        }
        out += "\n";
        out += "            TOMBSTONE => &SyntaxInfo { name: \"TOMBSTONE\" },\n";
        out += "            EOF => &SyntaxInfo { name: \"EOF\" },\n";
        out += "        }\n";
        out += "    }\n";
        out += "}\n";
        out += "\n";

        // `ident_to_keyword`: one arm per keyword, matching the keyword's
        // spelling (written as a string literal via `{:?}`) to its `_KW` kind.
        out += "pub(crate) fn ident_to_keyword(ident: &str) -> Option<SyntaxKind> {\n";
        out += "    match ident {\n";
        for kw in &self.keywords {
            write!(out, "        {:?} => Some({}),\n", kw, kw_token(kw)).unwrap();
        }
        out += "        _ => None,\n";
        out += "    }\n";
        out += "}\n";

        out
    }
}

/// Path of the grammar description: `grammar.ron` directly inside the
/// directory named by the compile-time `CARGO_MANIFEST_DIR` variable.
fn grammar_file() -> PathBuf {
    let mut path = PathBuf::from(env!("CARGO_MANIFEST_DIR"));
    path.push("grammar.ron");
    path
}

/// Path of the generated output: `src/syntax_kinds.rs` inside the directory
/// named by the compile-time `CARGO_MANIFEST_DIR` variable.
fn generated_file() -> PathBuf {
    let mut path = PathBuf::from(env!("CARGO_MANIFEST_DIR"));
    path.push("src/syntax_kinds.rs");
    path
}

/// Returns `word` with every ASCII lowercase letter upper-cased; all other
/// characters, including non-ASCII ones, are left unchanged.
fn scream(word: &str) -> String {
    word.to_ascii_uppercase()
}

/// Builds the kind name for a keyword: the upper-cased keyword followed by
/// the `_KW` suffix (e.g. `use` becomes `USE_KW`).
fn kw_token(keyword: &str) -> String {
    let mut token = scream(keyword);
    token.push_str("_KW");
    token
}