tree-sitter/update: factor repo list into nix

We want the ability to add different orga repos as well, and that is a
lot easier on the nix level.
This commit is contained in:
Profpatsch 2020-12-26 20:11:43 +01:00
parent a32c5d90e7
commit d2988dac8e
2 changed files with 65 additions and 57 deletions

View File

@ -1,6 +1,6 @@
{ lib, stdenv
, fetchgit, fetchFromGitHub, fetchurl
, writeShellScript, runCommand, which
, writeShellScript, runCommand, which, formats
, rustPlatform, jq, nix-prefetch-git, xe, curl, emscripten
, Security
, callPackage
@ -29,7 +29,7 @@ let
};
update-all-grammars = import ./update.nix {
inherit writeShellScript nix-prefetch-git curl jq xe src;
inherit writeShellScript nix-prefetch-git curl jq xe src formats;
};
fetchGrammar = (v: fetchgit {inherit (v) url rev sha256 fetchSubmodules; });

View File

@ -1,72 +1,80 @@
{ writeShellScript, nix-prefetch-git
{ writeShellScript, nix-prefetch-git, formats
, curl, jq, xe
, src }:
let
# Grammars we want to fetch from the tree-sitter github orga
knownTreeSitterOrgGrammarRepos = [
"tree-sitter-javascript"
"tree-sitter-c"
"tree-sitter-swift"
"tree-sitter-json"
"tree-sitter-cpp"
"tree-sitter-ruby"
"tree-sitter-razor"
"tree-sitter-go"
"tree-sitter-c-sharp"
"tree-sitter-python"
"tree-sitter-typescript"
"tree-sitter-rust"
"tree-sitter-bash"
"tree-sitter-php"
"tree-sitter-java"
"tree-sitter-scala"
"tree-sitter-ocaml"
"tree-sitter-julia"
"tree-sitter-agda"
"tree-sitter-fluent"
"tree-sitter-html"
"tree-sitter-haskell"
"tree-sitter-regex"
"tree-sitter-css"
"tree-sitter-verilog"
"tree-sitter-jsdoc"
"tree-sitter-ql"
"tree-sitter-embedded-template"
];
# repos of the tree-sitter github orga we want to ignore (not grammars)
ignoredTreeSitterOrgRepos = [
"tree-sitter"
"tree-sitter-cli"
# this is the haskell language bindings, tree-sitter-haskell is the grammar
"haskell-tree-sitter"
# this is the ruby language bindings, tree-sitter-ruby is the grammar
"ruby-tree-sitter"
# this is the (unmaintained) rust language bindings, tree-sitter-rust is the grammar
"rust-tree-sitter"
# this is the nodejs language bindings, tree-sitter-javascript is the grammar
"node-tree-sitter"
# this is the python language bindings, tree-sitter-python is the grammar
"py-tree-sitter"
# afl fuzzing for tree sitter
"afl-tree-sitter"
# archived
"highlight-schema"
# website
"tree-sitter.github.io"
];
jsonFile = name: val: (formats.json {}).generate name val;
# check in the list of grammars, whether we know all of them.
checkKnownGrammars = writeShellScript "get-grammars.sh" ''
set -euo pipefail
known='
[ "tree-sitter-javascript"
, "tree-sitter-c"
, "tree-sitter-swift"
, "tree-sitter-json"
, "tree-sitter-cpp"
, "tree-sitter-ruby"
, "tree-sitter-razor"
, "tree-sitter-go"
, "tree-sitter-c-sharp"
, "tree-sitter-python"
, "tree-sitter-typescript"
, "tree-sitter-rust"
, "tree-sitter-bash"
, "tree-sitter-php"
, "tree-sitter-java"
, "tree-sitter-scala"
, "tree-sitter-ocaml"
, "tree-sitter-julia"
, "tree-sitter-agda"
, "tree-sitter-fluent"
, "tree-sitter-html"
, "tree-sitter-haskell"
, "tree-sitter-regex"
, "tree-sitter-css"
, "tree-sitter-verilog"
, "tree-sitter-jsdoc"
, "tree-sitter-ql"
, "tree-sitter-embedded-template"
]'
ignore='
[ "tree-sitter"
, "tree-sitter-cli"
${/*this is the haskell language bindings, tree-sitter-haskell is the grammar*/""}
, "haskell-tree-sitter"
${/*this is the ruby language bindings, tree-sitter-ruby is the grammar*/""}
, "ruby-tree-sitter"
${/*this is the (unmaintained) rust language bindings, tree-sitter-rust is the grammar*/""}
, "rust-tree-sitter"
${/*this is the nodejs language bindings, tree-sitter-javascript is the grammar*/""}
, "node-tree-sitter"
${/*this is the python language bindings, tree-sitter-python is the grammar*/""}
, "py-tree-sitter"
${/*afl fuzzing for tree sitter*/""}
, "afl-tree-sitter"
${/*archived*/""}
, "highlight-schema"
${/*website*/""}
, "tree-sitter.github.io"
]'
known="${jsonFile "known-tree-sitter-org-grammar-repos" knownTreeSitterOrgGrammarRepos}"
ignore="${jsonFile "ignored-tree-sitter-org-repos" ignoredTreeSitterOrgRepos}"
res=$(${jq}/bin/jq \
--argjson known "$known" \
--argjson ignore "$ignore" \
'. - ($known + $ignore)' \
--slurpfile known "$known" \
--slurpfile ignore "$ignore" \
'. - ($known[0] + $ignore[0])' \
)
if [ ! "$res" == "[]" ]; then
echo "These repositories are neither known nor ignored:" 1>&2
echo "$res" 1>&2
exit 1
fi
printf '%s' "$known"
cat "$known"
'';
# TODO