We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 4a2ac97, commit caadf9a
main/resources/example/filter-duplicates.xml
@@ -0,0 +1,13 @@
1
+<?xml version="1.0" encoding="UTF-8"?>
2
+<metamorph xmlns="http://www.culturegraph.org/metamorph"
3
+ version="1" entityMarker=".">
4
+ <meta>
5
+ <name>Filter out records which contain only one hash</name>
6
+ </meta>
7
+
8
+ <rules>
9
+ <data source="SHA1" name="MATCH">
10
+ <occurrence only="moreThen 1" />
11
+ </data>
12
+ </rules>
13
+</metamorph>
main/resources/example/find-duplicate-files.flux
@@ -0,0 +1,11 @@
+default in = ".";
+in
+|walk-filetree
+|digest-file("sha1")
+|sort-triples(by="OBJECT")
+|reorder-triple(subjectFrom="object", objectFrom="subject")
+|collect-triples
+|filter(FLUX_DIR + "filter-duplicates.xml")
+|encode-formeta(style="multiline")
+|write("stdout");
0 commit comments