diff --git a/src/main/java/org/lobid/resources/run/CulturegraphXmlFilterHbzToJson.java b/src/main/java/org/lobid/resources/run/CulturegraphXmlFilterHbzToJson.java index 5a0635df69..1693c141cd 100644 --- a/src/main/java/org/lobid/resources/run/CulturegraphXmlFilterHbzToJson.java +++ b/src/main/java/org/lobid/resources/run/CulturegraphXmlFilterHbzToJson.java @@ -11,12 +11,12 @@ import org.metafacture.io.ObjectWriter; import org.metafacture.json.JsonEncoder; import org.metafacture.mangling.LiteralToObject; +import org.metafacture.metamorph.Filter; import org.metafacture.metamorph.Metamorph; import org.metafacture.strings.StringReader; import org.metafacture.xml.XmlDecoder; import org.metafacture.xml.XmlElementSplitter; - /** * Filter resources with hbz holdings from culturegraph marcxml, tranform it * into JSON and write this as an elasticsearch bulk json file. @@ -47,6 +47,8 @@ public static void main(String... args) { private static StringReader receiverThread() { final StringReader sr = new StringReader(); sr.setReceiver(new XmlDecoder()).setReceiver(new MarcXmlHandler()) + .setReceiver(new Filter( + new Metamorph("src/main/resources/morph-cg-to-es.xml"))) .setReceiver( new Metamorph("src/main/resources/morph-cg-to-es.xml")) .setReceiver(new JsonEncoder()) diff --git a/src/main/resources/morph-cg-to-es.xml b/src/main/resources/morph-cg-to-es.xml index 831b83a7be..98fdba7890 100644 --- a/src/main/resources/morph-cg-to-es.xml +++ b/src/main/resources/morph-cg-to-es.xml @@ -12,11 +12,15 @@ - + - - + + + + + + diff --git a/src/test/java/org/lobid/resources/CulturegraphXmlFilterHbzToJsonTest.java b/src/test/java/org/lobid/resources/CulturegraphXmlFilterHbzToJsonTest.java index 03aaa5f5e0..85b00ef3f6 100644 --- a/src/test/java/org/lobid/resources/CulturegraphXmlFilterHbzToJsonTest.java +++ b/src/test/java/org/lobid/resources/CulturegraphXmlFilterHbzToJsonTest.java @@ -18,6 +18,7 @@ import org.metafacture.io.ObjectWriter; import org.metafacture.json.JsonEncoder; import org.metafacture.mangling.LiteralToObject; +import org.metafacture.metamorph.Filter; import org.metafacture.metamorph.Metamorph; import org.metafacture.strings.StringReader; import org.metafacture.xml.XmlDecoder; @@ -76,8 +77,9 @@ static void et() { private static StringReader receiverThread() { final StringReader sr = new StringReader(); sr.setReceiver(new XmlDecoder()).setReceiver(new MarcXmlHandler()) - .setReceiver( - new Metamorph("src/main/resources/morph-cg-to-es.xml")) + .setReceiver(new Filter( + new Metamorph("src/main/resources/morph-cg-to-es.xml"))) + .setReceiver(new Metamorph("src/main/resources/morph-cg-to-es.xml")) .setReceiver(new JsonEncoder()) .setReceiver(new JsonToElasticsearchBulk("rvk", "cg")) .setReceiver(new ObjectWriter<>(JSON_TEST_FILE)); diff --git a/src/test/resources/aggregate_auslieferung_20191212.small.marcxml b/src/test/resources/aggregate_auslieferung_20191212.small.marcxml index cf25427d3f..88f5e7130d 100644 --- a/src/test/resources/aggregate_auslieferung_20191212.small.marcxml +++ b/src/test/resources/aggregate_auslieferung_20191212.small.marcxml @@ -29,7 +29,7 @@ 8\p - (DE-605)HT013317056 + (DE-608)HT013317056 1\p @@ -550,7 +550,7 @@ 9\p - DE-605 + DE-608 1\p @@ -1444,7 +1444,7 @@ 13\p - DE-605 + DE-608 1\p 7\p 9\p diff --git a/src/test/resources/jsonld-cg/bulk.ndjson b/src/test/resources/jsonld-cg/bulk.ndjson index 06f08f615c..f9cbcdb509 100644 --- a/src/test/resources/jsonld-cg/bulk.ndjson +++ b/src/test/resources/jsonld-cg/bulk.ndjson @@ -1,4 +1,2 @@ {"index":{"_index":"cg","_type":"rvk","_id":null}} -{"rvk":["LG 8100","56","13","6,15","48","LS 30100","FB 4019","LQ 88600","LR 11121","6,12","6,11","LS 16200","13.1c","930","3.1","900","15.07","60","15.17","16.3","63","NH 6880","24.50","9,2"],"hbzId":["HT013317056"]} -{"index":{"_index":"cg","_type":"rvk","_id":null}} -{"rvk":["4.7p","CI 5837","CI 1125","CI 5604","CI 5603","100","IH 34381","CI 1100","10.02","CI 5310","08.31","5,1","EC 2430","10"],"hbzId":["HT013166356","HT018625006","TT000577460"]} +{"rvk":["4.7p","CI 5837","CI 1125","CI 5604","CI 5603","100","IH 34381","CI 1100","10.02","CI 5310","08.31","5,1","EC 2430","10"],"id":["TT000577460","HT018625006","HT013166356"]}