Build tree-sitter parsers in parallel

edge_only_predecessors
Wilfred Hughes 2021-09-22 22:02:07 +07:00
parent 05d0234061
commit 5991efdcc7
3 changed files with 127 additions and 88 deletions

1
Cargo.lock generated

@ -250,6 +250,7 @@ dependencies = [
"pretty_assertions",
"pretty_env_logger",
"radix-heap",
"rayon",
"regex",
"rustc-hash",
"strsim 0.10.0",

@ -43,6 +43,7 @@ criterion = { version = "0.3", features = ["html_reports"] }
[build-dependencies]
cc="1.0"
rayon = "1.5"
[[bench]]
name = "parse_and_diff"

@ -1,104 +1,141 @@
use rayon::prelude::*;
use std::path::PathBuf;
fn build(package_name: &str, package_dir: &str, extra_files: &[&str]) {
let dir = PathBuf::from(package_dir);
struct TreeSitterParser {
name: String,
src_dir: String,
extra_files: Vec<String>,
}
impl TreeSitterParser {
fn build(&self) {
let dir = PathBuf::from(&self.src_dir);
let mut c_files = vec!["parser.c"];
let mut cpp_files = vec![];
let mut c_files = vec!["parser.c"];
let mut cpp_files = vec![];
for file in extra_files {
if file.ends_with(".c") {
c_files.push(file);
} else {
cpp_files.push(file);
for file in &self.extra_files {
if file.ends_with(".c") {
c_files.push(file);
} else {
cpp_files.push(file);
}
}
}
if !cpp_files.is_empty() {
let mut cpp_build = cc::Build::new();
cpp_build
.include(&dir)
.cpp(true)
.flag("-Wno-unused-parameter")
.flag("-Wno-ignored-qualifiers");
for file in cpp_files {
cpp_build.file(dir.join(file));
if !cpp_files.is_empty() {
let mut cpp_build = cc::Build::new();
cpp_build
.include(&dir)
.cpp(true)
.flag("-Wno-unused-parameter")
.flag("-Wno-ignored-qualifiers");
for file in cpp_files {
cpp_build.file(dir.join(file));
}
cpp_build.compile(&format!("{}-cpp", self.name));
}
cpp_build.compile(&format!("{}-cpp", package_name));
}
let mut build = cc::Build::new();
build.include(&dir).warnings(false); // ignore unused parameter warnings
for file in c_files {
build.file(dir.join(file));
let mut build = cc::Build::new();
build.include(&dir).warnings(false); // ignore unused parameter warnings
for file in c_files {
build.file(dir.join(file));
}
build.compile(&self.name);
}
build.compile(package_name);
}
fn main() {
// Only rerun if files in the vendor/ directory change.
// TODO: use specific source directories instead.
println!("cargo:rerun-if-changed=vendor");
// TODO: build these in parallel.
build("tree-sitter-c", "vendor/tree-sitter-c-src", &[]);
build(
"tree-sitter-cpp",
"vendor/tree-sitter-cpp-src",
&["scanner.cc"],
);
build("tree-sitter-clojure", "vendor/tree-sitter-clojure-src", &[]);
build(
"tree-sitter-css",
"vendor/tree-sitter-css-src",
&["scanner.c"],
);
build("tree-sitter-elisp", "vendor/tree-sitter-elisp-src", &[]);
build(
"tree-sitter-elixir",
"vendor/tree-sitter-elixir-src",
&["scanner.cc"],
);
build("tree-sitter-go", "vendor/tree-sitter-go-src", &[]);
build(
"tree-sitter-haskell",
"vendor/tree-sitter-haskell-src",
&["scanner.cc"],
);
build("tree-sitter-java", "vendor/tree-sitter-java-src", &[]);
build(
"tree-sitter-javascript",
"vendor/tree-sitter-javascript-src",
&["scanner.c"],
);
build("tree-sitter-json", "vendor/tree-sitter-json-src", &[]);
build(
"tree-sitter-ocaml",
"vendor/tree-sitter-ocaml-src/ocaml/src",
&["scanner.cc"],
);
build(
"tree-sitter-ocaml-interface",
"vendor/tree-sitter-ocaml-src/interface/src",
&["scanner.cc"],
);
build(
"tree-sitter-python",
"vendor/tree-sitter-python-src",
&["scanner.cc"],
);
build(
"tree-sitter-rust",
"vendor/tree-sitter-rust-src",
&["scanner.c"],
);
build(
"tree-sitter-tsx",
"vendor/tree-sitter-typescript-src/tsx/src",
&["scanner.c"],
);
build(
"tree-sitter-typescript",
"vendor/tree-sitter-typescript-src/typescript/src",
&["scanner.c"],
);
let parsers = vec![
TreeSitterParser {
name: "tree-sitter-c".into(),
src_dir: "vendor/tree-sitter-c-src".into(),
extra_files: vec![],
},
TreeSitterParser {
name: "tree-sitter-cpp".into(),
src_dir: "vendor/tree-sitter-cpp-src".into(),
extra_files: vec!["scanner.cc".into()],
},
TreeSitterParser {
name: "tree-sitter-clojure".into(),
src_dir: "vendor/tree-sitter-clojure-src".into(),
extra_files: vec![],
},
TreeSitterParser {
name: "tree-sitter-css".into(),
src_dir: "vendor/tree-sitter-css-src".into(),
extra_files: vec!["scanner.c".into()],
},
TreeSitterParser {
name: "tree-sitter-elisp".into(),
src_dir: "vendor/tree-sitter-elisp-src".into(),
extra_files: vec![],
},
TreeSitterParser {
name: "tree-sitter-elixir".into(),
src_dir: "vendor/tree-sitter-elixir-src".into(),
extra_files: vec!["scanner.cc".into()],
},
TreeSitterParser {
name: "tree-sitter-go".into(),
src_dir: "vendor/tree-sitter-go-src".into(),
extra_files: vec![],
},
TreeSitterParser {
name: "tree-sitter-haskell".into(),
src_dir: "vendor/tree-sitter-haskell-src".into(),
extra_files: vec!["scanner.cc".into()],
},
TreeSitterParser {
name: "tree-sitter-java".into(),
src_dir: "vendor/tree-sitter-java-src".into(),
extra_files: vec![],
},
TreeSitterParser {
name: "tree-sitter-javascript".into(),
src_dir: "vendor/tree-sitter-javascript-src".into(),
extra_files: vec!["scanner.c".into()],
},
TreeSitterParser {
name: "tree-sitter-json".into(),
src_dir: "vendor/tree-sitter-json-src".into(),
extra_files: vec![],
},
TreeSitterParser {
name: "tree-sitter-ocaml".into(),
src_dir: "vendor/tree-sitter-ocaml-src/ocaml/src".into(),
extra_files: vec!["scanner.cc".into()],
},
TreeSitterParser {
name: "tree-sitter-ocaml-interface".into(),
src_dir: "vendor/tree-sitter-ocaml-src/interface/src".into(),
extra_files: vec!["scanner.cc".into()],
},
TreeSitterParser {
name: "tree-sitter-python".into(),
src_dir: "vendor/tree-sitter-python-src".into(),
extra_files: vec!["scanner.cc".into()],
},
TreeSitterParser {
name: "tree-sitter-rust".into(),
src_dir: "vendor/tree-sitter-rust-src".into(),
extra_files: vec!["scanner.c".into()],
},
TreeSitterParser {
name: "tree-sitter-tsx".into(),
src_dir: "vendor/tree-sitter-typescript-src/tsx/src".into(),
extra_files: vec!["scanner.c".into()],
},
TreeSitterParser {
name: "tree-sitter-typescript".into(),
src_dir: "vendor/tree-sitter-typescript-src/typescript/src".into(),
extra_files: vec!["scanner.c".into()],
},
];
parsers.par_iter().for_each(|p| p.build());
}