xtask/
fetch_queries.rs

1use std::{fs, path::PathBuf};
2
3use anyhow::{anyhow, bail, Context, Result};
4use lazy_regex::regex_captures;
5use once_cell::sync::Lazy;
6
7pub fn run() -> Result<()> {
8    static QUERIES_DIR: Lazy<PathBuf> = Lazy::new(|| crate::WORKSPACE_DIR.join("queries"));
9    for lang in fs::read_dir(&*QUERIES_DIR)? {
10        let lang = lang?;
11        if lang.path().is_file() {
12            continue;
13        }
14        let lang_name = lang.file_name().to_string_lossy().into_owned();
15
16        for file in fs::read_dir(lang.path())? {
17            let file = file?;
18
19            let old_query = fs::read_to_string(file.path())?;
20            let filename = file.file_name().to_string_lossy().into_owned();
21
22            let Some((_, host, user, repo, branch, path)) = regex_captures!(
23                r"^;; Forked from https://(github|gitlab)\.com/([^/]*)/([^/]*)/(?:-/)?(?:blob|tree)/([^/]*)/([^?#\n]*)",
24                &old_query
25            ) else {
26                println!("\x1b[1;33mwarning:\x1b[22m {lang_name}/{filename} does not specify a fork source\x1b[0m");
27                continue;
28            };
29
30            let url = match host {
31                "github" => {
32                    format!("https://raw.githubusercontent.com/{user}/{repo}/{branch}/{path}")
33                }
34                "gitlab" => format!("https://gitlab.com/{user}/{repo}/-/raw/{branch}/{path}"),
35                _ => unreachable!("the regex only allows above options"),
36            };
37            println!("fetching new {lang_name}/{filename} from {url}");
38            let res = reqwest::blocking::get(url).with_context(|| "query request failed")?;
39            let query = match res.status().is_success() {
40                true => res.text()?,
41                false => bail!(
42                    "query request returned non-success status code: {}",
43                    res.status()
44                ),
45            };
46            let query = format!(
47                "{:#}",
48                rsexpr::from_slice_multi(&query).map_err(|errs| anyhow!(errs
49                    .into_iter()
50                    .map(|err| err.to_string())
51                    .collect::<Vec<_>>()
52                    .join(", ")))?
53            );
54            fs::write(file.path().with_file_name(format!("new.{filename}")), query)?;
55        }
56    }
57
58    // look for missing queries
59    let langs_toml_path = crate::WORKSPACE_DIR.join("syntastica-macros/languages.toml");
60    let mut langs_toml = fs::read_to_string(&langs_toml_path)?;
61    for lang in &crate::LANGUAGE_CONFIG.languages {
62        let kinds = match (lang.queries.injections, lang.queries.locals) {
63            (false, false) => &["injections", "locals"][..],
64            (false, true) => &["injections"],
65            (true, false) => &["locals"],
66            (true, true) => &[],
67        };
68
69        for &kind in kinds {
70            let queries = fetch_query(&lang.name, kind)?;
71            if let Some(text) = queries {
72                fs::write(
73                    crate::WORKSPACE_DIR.join(format!("queries/{}/{kind}.scm", lang.name)),
74                    text,
75                )?;
76                println!("found new {kind} queries for {}", lang.name);
77
78                let (before, rest) = langs_toml
79                    .split_once(&format!("\nname = \"{}\"", lang.name))
80                    .expect("language should be lang config");
81                if kind == "injections" {
82                    langs_toml = format!(
83                        "{before}\nname = \"{}\"{}",
84                        lang.name,
85                        rest.replacen("\ninjections = false", "\ninjections = true", 1),
86                    );
87                } else if kind == "locals" {
88                    langs_toml = format!(
89                        "{before}\nname = \"{}\"{}",
90                        lang.name,
91                        rest.replacen("\nlocals = false", "\nlocals = true", 1),
92                    );
93                }
94            }
95        }
96    }
97    fs::write(&langs_toml_path, langs_toml)?;
98
99    Ok(())
100}
101
102fn forked_from(name: &str, file: &str, content: &str) -> String {
103    format!(";; Forked from https://github.com/nvim-treesitter/nvim-treesitter/blob/master/queries/{name}/{file}.scm
104;; Licensed under the Apache License 2.0
105{content}")
106}
107
108pub fn fetch_query(name: &str, kind: &str) -> Result<Option<String>> {
109    const BASE_URL: &str =
110        "https://raw.githubusercontent.com/nvim-treesitter/nvim-treesitter/HEAD/queries";
111    reqwest::blocking::get(format!("{BASE_URL}/{name}/{kind}.scm"))
112        .ok()
113        .and_then(|res| match res.status().is_success() {
114            true => res.text().ok(),
115            false => None,
116        })
117        .map(|query| {
118            Ok::<_, anyhow::Error>(forked_from(
119                name,
120                kind,
121                &format!(
122                    "{:#}",
123                    rsexpr::from_slice_multi(&query)
124                        .map_err(|errs| anyhow!(errs
125                            .into_iter()
126                            .map(|err| err.to_string())
127                            .collect::<Vec<_>>()
128                            .join(", ")))
129                        .context("failed to parse downloaded queries")?
130                ),
131            ))
132        })
133        .transpose()
134}