@@ -7,7 +7,7 @@ HTMLS_DIR = $(ARXIV_DIR)/htmls
7
7
# Output directories for cleaned HTML and extracted tables.
# Kept as recursively expanded (`=`) variables so that they are re-evaluated
# wherever they are used, including recipes that run under a target-specific
# override of a variable they depend on.
FIXED_HTMLS_DIR = $(ARXIV_DIR)/htmls-clean
TABLES_DIR = $(ARXIV_DIR)/tables

# Input archives. GNU Make's $(wildcard) has no recursive `**` glob (it behaves
# like a single `*`), so both supported layouts are listed explicitly:
#   $(ARCHIVES_DIR)/<name>.gz        - flat layout
#   $(ARCHIVES_DIR)/<dir>/<name>.gz  - one directory level of nesting
ARCHIVES = $(wildcard $(ARCHIVES_DIR)/*.gz $(ARCHIVES_DIR)/*/*.gz)

# Per-archive outputs: the `%` stem keeps any sub-directory part of the archive
# path, so each output mirrors the location of its archive.
UNPACKS = $(patsubst $(ARCHIVES_DIR)/%.gz,$(UNPACKED_DIR)/%,$(ARCHIVES))
HTMLS = $(patsubst $(ARCHIVES_DIR)/%.gz,$(HTMLS_DIR)/%.html,$(ARCHIVES))
FIXED_HTMLS = $(patsubst $(ARCHIVES_DIR)/%.gz,$(FIXED_HTMLS_DIR)/%.html,$(ARCHIVES))
@@ -18,6 +18,15 @@ $(shell mkdir -p "$(DATA_DIR)" "$(UNPACKED_DIR)" "$(HTMLS_DIR)" "$(FIXED_HTMLS_D
18
18
# Aggregate goal: both annotation URL lists plus everything extract_all builds.
.PHONY: all
all: \
    $(ANNOTATIONS_DIR)/pdfs-urls.csv \
    $(ANNOTATIONS_DIR)/sources-urls.csv \
    extract_all
20
20
21
# Smoke test: pack test/src into a single archive inside a scratch data
# directory, run the extraction pipeline on it, and compare the first
# extracted table with the expected CSV stored next to the test sources.
#
# DATA_DIR is overridden for this target only; the directory variables used in
# the recipe presumably derive from it (their definitions are not visible
# here - confirm). The pipeline runs in a sub-make so that the file lists are
# computed after paper.gz has been created and with DATA_DIR applied to the
# whole run.
.PHONY: test
test: DATA_DIR = test/data
test:
	mkdir -p "$(ARCHIVES_DIR)"
	tar czf "$(ARCHIVES_DIR)/paper.gz" -C test/src .
	$(MAKE) DATA_DIR="$(DATA_DIR)" extract_all
	cat "$(TABLES_DIR)/paper/table_01.csv"
	diff -u "$(TABLES_DIR)/paper/table_01.csv" test/src/table_01.csv
29
+
21
30
# Aggregate goal: satisfied once every file listed in $(TABLES) is up to date.
extract_all: $(TABLES)
22
31
23
32
fix_htmls_all : $(FIXED_HTMLS )
@@ -53,6 +62,7 @@ $(ANNOTATIONS_DIR)/%: $(ANNOTATIONS_DIR)/%.gz
53
62
# Download the compressed evaluation-tables dump from paperswithcode.com.
# The file is fetched under a temporary name and renamed only after wget
# succeeds, so an interrupted or failed download never leaves a truncated
# target that Make would consider up to date.
$(ANNOTATIONS_DIR)/evaluation-tables.json.gz:
	wget https://paperswithcode.com/media/about/evaluation-tables.json.gz -O "$@.tmp" || { rm -f "$@.tmp"; exit 1; }
	mv -f "$@.tmp" "$@"
55
64
65
+
56
66
.PHONY : clean
57
67
clean :
58
68
cd " $( ANNOTATIONS_DIR) " && rm -f * .json * .csv
0 commit comments