Number the intermediate files of the enrichment pipeline.

Makefile: every data/*.json target and prerequisite gains a two-digit
prefix (01- to 09-) reflecting its position in the dependency chain.
.gitignore: the ignore entries become data/*corpus... globs so the
prefixed files stay ignored; entries for corpus.json, the rnsr step and
the teeft-en step are added.

diff --git a/.gitignore b/.gitignore
index 67f134e..49cb4f0 100644
--- a/.gitignore
+++ b/.gitignore
@@ -3,12 +3,15 @@
 test-pascal.ini
 tmp*.json
 Tests.md
-data/corpus-simple.json
-data/corpus-simple-etab.json
-data/corpus-simple-instituts.json
-data/corpus-simple-label-pascal.json
-data/corpus-simple-pascal.json
-data/corpus-simple-cnrs.json
+data/*corpus.json
+data/*corpus-simple.json
+data/*corpus-simple-etab.json
+data/*corpus-simple-instituts.json
+data/*corpus-simple-label-pascal.json
+data/*corpus-simple-pascal.json
+data/*corpus-simple-cnrs.json
+data/*corpus-simple-rnsr.json
+data/*corpus-simple-teeft-en.json
 data/*.gz
 corpus_WoS_vol1.json
 corpus-test.json
diff --git a/Makefile b/Makefile
index 9811ea6..aea3f4a 100644
--- a/Makefile
+++ b/Makefile
@@ -3,29 +3,29 @@
 # See https://tech.davis-hansson.com/p/make/#change-some-make-defaults
 .DELETE_ON_ERROR:
 
-data/corpus-simple-cnrs.json: data/corpus-simple-label-pascal.json
+data/09-corpus-simple-cnrs.json: data/08-corpus-simple-label-pascal.json
 	npx ezs detect-cnrs.ini < $< > $@
 
-data/corpus-simple-label-pascal.json: data/corpus-simple-pascal.json
+data/08-corpus-simple-label-pascal.json: data/07-corpus-simple-pascal.json
 	npx ezs extract-pascal-label.ini < $< > $@
 
-data/corpus-simple-pascal.json: data/corpus-simple-teeft-en.json
+data/07-corpus-simple-pascal.json: data/06-corpus-simple-teeft-en.json
 	npx ezs enrich-pascal.ini < $< > $@
 
-data/corpus-simple-teeft-en.json: data/corpus-simple-instituts.json
+data/06-corpus-simple-teeft-en.json: data/05-corpus-simple-instituts.json
 	npx ezs enrich-teeft-en.ini < $< > $@
 
-data/corpus-simple-instituts.json: data/corpus-simple-etab.json
+data/05-corpus-simple-instituts.json: data/04-corpus-simple-etab.json
 	npx ezs enrich-institutes.ini < $< > $@
 
-data/corpus-simple-etab.json: data/corpus-simple-rnsr.json
+data/04-corpus-simple-etab.json: data/03-corpus-simple-rnsr.json
 	npx ezs enrich-etab.ini < $< > $@
 
-data/corpus-simple-rnsr.json: data/corpus-simple.json 
+data/03-corpus-simple-rnsr.json: data/02-corpus-simple.json
 	npx ezs enrich-rnsr.ini < $< > $@
 
-data/corpus-simple.json: data/corpus.json
+data/02-corpus-simple.json: data/01-corpus.json
 	npx ezs extract-fields.ini < $< > $@
 
-data/corpus.json: dois.txt
+data/01-corpus.json: dois.txt
 	npx ezs harvest-from-doi.ini < $< > $@