BatchLoader improvements for Mimic upload

This commit is contained in:
Grahame Grieve 2019-11-10 21:04:55 +11:00
parent 3ae115c62d
commit 9ffdf6e81c
2 changed files with 146 additions and 96 deletions

View File

@ -23,14 +23,18 @@ package org.hl7.fhir.dstu3.utils;
import java.io.File; import java.io.File;
import java.io.FileInputStream; import java.io.FileInputStream;
import java.io.FileNotFoundException;
import java.io.IOException; import java.io.IOException;
import java.net.URISyntaxException; import java.net.URISyntaxException;
import java.text.SimpleDateFormat;
import java.util.Date;
import java.util.UUID; import java.util.UUID;
import java.util.zip.ZipEntry; import java.util.zip.ZipEntry;
import java.util.zip.ZipInputStream; import java.util.zip.ZipInputStream;
import org.hl7.fhir.dstu3.formats.IParser; import org.hl7.fhir.dstu3.formats.IParser;
import org.hl7.fhir.dstu3.formats.JsonParser; import org.hl7.fhir.dstu3.formats.JsonParser;
import org.hl7.fhir.dstu3.formats.XmlParser;
import org.hl7.fhir.dstu3.model.Bundle; import org.hl7.fhir.dstu3.model.Bundle;
import org.hl7.fhir.dstu3.model.Bundle.BundleEntryComponent; import org.hl7.fhir.dstu3.model.Bundle.BundleEntryComponent;
import org.hl7.fhir.dstu3.model.Bundle.BundleType; import org.hl7.fhir.dstu3.model.Bundle.BundleType;
@ -38,105 +42,147 @@ import org.hl7.fhir.dstu3.model.Bundle.HTTPVerb;
import org.hl7.fhir.dstu3.model.Resource; import org.hl7.fhir.dstu3.model.Resource;
import org.hl7.fhir.dstu3.utils.client.FHIRToolingClient; import org.hl7.fhir.dstu3.utils.client.FHIRToolingClient;
import org.hl7.fhir.exceptions.FHIRException; import org.hl7.fhir.exceptions.FHIRException;
import org.hl7.fhir.exceptions.FHIRFormatError;
import org.hl7.fhir.utilities.IniFile;
import org.hl7.fhir.utilities.Utilities; import org.hl7.fhir.utilities.Utilities;
public class BatchLoader { public class BatchLoader {
public static void main(String[] args) throws IOException, Exception { public static void main(String[] args) throws IOException, Exception {
if (args.length < 4) { if (args.length < 3) {
System.out.println("Batch uploader takes 4 parameters in order: server base url, file/folder to upload, xml/json, and batch size"); System.out.println("Batch uploader takes 3 parameters in order: server base url, file/folder to upload, and batch size");
} else { } else {
String server = args[0]; String server = args[0];
String file = args[1]; String file = args[1];
IParser p = new JsonParser(); // args[2].equals("json") ? new JsonParser() : new XmlParser(); int size = Integer.parseInt(args[2]);
int size = Integer.parseInt(args[3]); if (file.endsWith(".xml")) {
size = 500; throw new FHIRException("Unimplemented file type "+file);
if (file.endsWith(".xml")) { } else if (file.endsWith(".json")) {
throw new FHIRException("Unimplemented file type "+file); throw new FHIRException("Unimplemented file type "+file);
} else if (file.endsWith(".json")) { // } else if (file.endsWith(".zip")) {
throw new FHIRException("Unimplemented file type "+file); // LoadZipFile(server, file, p, size, 0, -1);
} else if (file.endsWith(".zip")) { } else if (new File(file).isDirectory()) {
LoadZipFile(server, file, p, size, 0, -1); LoadDirectory(server, file, size);
} else if (new File(file).isDirectory()) { } else
LoadDirectory(server, file, p, size); throw new FHIRException("Unknown file type "+file);
} else }
throw new FHIRException("Unknown file type "+file);
}
}
private static void LoadDirectory(String server, String file, IParser p, int size) throws IOException, Exception {
// LoadZipFile(server, Utilities.path(file, "Patient.json.zip"), p, size, 1000, -1);
// LoadZipFile(server, Utilities.path(file, "Binary.json.zip"), p, size, 0, -1);
// LoadZipFile(server, Utilities.path(file, "DocumentReference.json.zip"), p, size, 0, -1);
// LoadZipFile(server, Utilities.path(file, "Encounter.json.zip"), p, size, 0, -1);
// LoadZipFile(server, Utilities.path(file, "Organization.json.zip"), p, size, 0, -1);
// LoadZipFile(server, Utilities.path(file, "Procedure.json.zip"), p, size, 0, -1);
// LoadZipFile(server, Utilities.path(file, "AllergyIntolerance.json.zip"), p, size, 1500, -1);
// LoadZipFile(server, Utilities.path(file, "Condition.json.zip"), p, size, 0, -1);
LoadZipFile(server, Utilities.path(file, "Immunization.json.zip"), p, size, 0, -1);
// LoadZipFile(server, Utilities.path(file, "MedicationStatement.json.zip"), p, size, 0, -1);
// LoadZipFile(server, Utilities.path(file, "Observation-res.json.zip"), p, size, 0, -1);
// LoadZipFile(server, Utilities.path(file, "Observation-sh.json.zip"), p, size, 0, -1);
// LoadZipFile(server, Utilities.path(file, "Observation-vs.json.zip"), p, size, 0, -1);
// LoadZipFile(server, Utilities.path(file, "Observation-gen.json.zip"), p, size, 0, -1);
// LoadZipFile(server, Utilities.path(file, "List.json.zip"), p, size, 6500, -1);
// LoadZipFile(server, Utilities.path(file, "List-res.json.zip"), p, size, 0, -1);
// LoadZipFile(server, Utilities.path(file, "List-vs.json.zip"), p, size, 0, -1);
} }
private static void LoadDirectory(String server, String folder, int size) throws IOException, Exception {
private static void LoadZipFile(String server, String file, IParser p, int size, int start, int end) throws IOException, Exception { System.out.print("Connecting to "+server+".. ");
System.out.println("Load Zip file "+file); FHIRToolingClient client = new FHIRToolingClient(server);
Bundle b = new Bundle(); System.out.println("Done");
b.setType(BundleType.COLLECTION);
b.setId(UUID.randomUUID().toString().toLowerCase()); IniFile ini = new IniFile(Utilities.path(folder, "batch-load-progress.ini"));
ZipInputStream zip = new ZipInputStream(new FileInputStream(file)); for (File f : new File(folder).listFiles()) {
ZipEntry entry; if (f.getName().endsWith(".json") || f.getName().endsWith(".xml")) {
while((entry = zip.getNextEntry())!=null) if (!ini.getBooleanProperty("finished", f.getName())) {
{ sendFile(client, f, size, ini);
try { }
Resource r = p.parse(zip); }
b.addEntry().setResource(r);
} catch (Exception e) {
throw new Exception("Error parsing "+entry.getName()+": "+e.getMessage(), e);
}
} }
loadBundle(server, b, size, start, end); }
}
private static int loadBundle(String server, Bundle b, int size, int start, int end) throws URISyntaxException { private static void sendFile(FHIRToolingClient client, File f, int size, IniFile ini) throws FHIRFormatError, FileNotFoundException, IOException {
System.out.println("Post to "+server+". size = "+Integer.toString(size)+", start = "+Integer.toString(start)+", total = "+Integer.toString(b.getEntry().size())); long ms = System.currentTimeMillis();
FHIRToolingClient client = new FHIRToolingClient(server); System.out.print("Loading "+f.getName()+".. ");
int c = start; IParser parser = f.getName().endsWith(".json") ? new JsonParser() : new XmlParser();
if (end == -1) Resource res = parser.parse(new FileInputStream(f));
end = b.getEntry().size(); System.out.println(" done: ("+Long.toString(System.currentTimeMillis()-ms)+" ms)");
while (c < end) {
Bundle bt = new Bundle(); if (res instanceof Bundle) {
bt.setType(BundleType.BATCH); Bundle bnd = (Bundle) res;
bt.setId(UUID.randomUUID().toString().toLowerCase()); int cursor = ini.hasProperty("progress", f.getName()) ? ini.getIntegerProperty("progress", f.getName()) : 0;
for (int i = c; i < Math.min(b.getEntry().size(), c+size); i++) { while (cursor < bnd.getEntry().size()) {
BundleEntryComponent be = bt.addEntry(); Bundle bt = new Bundle();
be.setResource(b.getEntry().get(i).getResource()); bt.setType(BundleType.BATCH);
be.getRequest().setMethod(HTTPVerb.PUT); bt.setId(UUID.randomUUID().toString().toLowerCase());
be.getRequest().setUrl(be.getResource().getResourceType().toString()+"/"+be.getResource().getId()); for (int i = cursor; i < Math.min(bnd.getEntry().size(), cursor+size); i++) {
} BundleEntryComponent be = bt.addEntry();
System.out.print(" posting.."); be.setResource(bnd.getEntry().get(i).getResource());
long ms = System.currentTimeMillis(); be.getRequest().setMethod(HTTPVerb.PUT);
Bundle resp = client.transaction(bt); be.getRequest().setUrl(be.getResource().getResourceType().toString()+"/"+be.getResource().getId());
}
for (int i = 0; i < resp.getEntry().size(); i++) { System.out.print(f.getName()+" ("+cursor+"/"+bnd.getEntry().size()+"): ");
BundleEntryComponent t = resp.getEntry().get(i); ms = System.currentTimeMillis();
if (!t.getResponse().getStatus().startsWith("2")) { Bundle resp = client.transaction(bt);
System.out.println("failed status at "+Integer.toString(i)+": "+t.getResponse().getStatus());
return c+i; int ncursor = cursor+size;
} for (int i = 0; i < resp.getEntry().size(); i++) {
} BundleEntryComponent t = resp.getEntry().get(i);
c = c + size; if (!t.getResponse().getStatus().startsWith("2")) {
System.out.println(" ..done: "+Integer.toString(c)+". ("+Long.toString(System.currentTimeMillis()-ms)+" ms)"); System.out.println("failed status at "+Integer.toString(i)+": "+t.getResponse().getStatus());
} ncursor = cursor+i-1;
System.out.println(" done"); break;
return c; }
} }
cursor = ncursor;
System.out.println(" .. done: ("+Long.toString(System.currentTimeMillis()-ms)+" ms) "+SimpleDateFormat.getInstance().format(new Date()));
ini.setIntegerProperty("progress", f.getName(), cursor, null);
ini.save();
}
ini.setBooleanProperty("finished", f.getName(), true, null);
ini.save();
} else {
client.update(res);
ini.setBooleanProperty("finished", f.getName(), true, null);
ini.save();
}
}
//
// private static void LoadZipFile(String server, String file, IParser p, int size, int start, int end) throws IOException, Exception {
// System.out.println("Load Zip file "+file);
// Bundle b = new Bundle();
// b.setType(BundleType.COLLECTION);
// b.setId(UUID.randomUUID().toString().toLowerCase());
// ZipInputStream zip = new ZipInputStream(new FileInputStream(file));
// ZipEntry entry;
// while((entry = zip.getNextEntry())!=null)
// {
// try {
// Resource r = p.parse(zip);
// b.addEntry().setResource(r);
// } catch (Exception e) {
// throw new Exception("Error parsing "+entry.getName()+": "+e.getMessage(), e);
// }
// }
// loadBundle(server, b, size, start, end);
// }
//
//
// private static int loadBundle(String server, Bundle b, int size, int start, int end) throws URISyntaxException {
// System.out.println("Post to "+server+". size = "+Integer.toString(size)+", start = "+Integer.toString(start)+", total = "+Integer.toString(b.getEntry().size()));
// FHIRToolingClient client = new FHIRToolingClient(server);
// int c = start;
// if (end == -1)
// end = b.getEntry().size();
// while (c < end) {
// Bundle bt = new Bundle();
// bt.setType(BundleType.BATCH);
// bt.setId(UUID.randomUUID().toString().toLowerCase());
// for (int i = c; i < Math.min(b.getEntry().size(), c+size); i++) {
// BundleEntryComponent be = bt.addEntry();
// be.setResource(b.getEntry().get(i).getResource());
// be.getRequest().setMethod(HTTPVerb.PUT);
// be.getRequest().setUrl(be.getResource().getResourceType().toString()+"/"+be.getResource().getId());
// }
// System.out.print(" posting..");
// long ms = System.currentTimeMillis();
// Bundle resp = client.transaction(bt);
//
// for (int i = 0; i < resp.getEntry().size(); i++) {
// BundleEntryComponent t = resp.getEntry().get(i);
// if (!t.getResponse().getStatus().startsWith("2")) {
// System.out.println("failed status at "+Integer.toString(i)+": "+t.getResponse().getStatus());
// return c+i;
// }
// }
// c = c + size;
// System.out.println(" ..done: "+Integer.toString(c)+". ("+Long.toString(System.currentTimeMillis()-ms)+" ms)");
// }
// System.out.println(" done");
// return c;
// }
} }

View File

@ -26,6 +26,8 @@ import java.io.FileInputStream;
import java.io.FileNotFoundException; import java.io.FileNotFoundException;
import java.io.IOException; import java.io.IOException;
import java.net.URISyntaxException; import java.net.URISyntaxException;
import java.text.SimpleDateFormat;
import java.util.Date;
import java.util.UUID; import java.util.UUID;
import java.util.zip.ZipEntry; import java.util.zip.ZipEntry;
import java.util.zip.ZipInputStream; import java.util.zip.ZipInputStream;
@ -84,10 +86,11 @@ public class BatchLoader {
private static void sendFile(FHIRToolingClient client, File f, int size, IniFile ini) throws FHIRFormatError, FileNotFoundException, IOException { private static void sendFile(FHIRToolingClient client, File f, int size, IniFile ini) throws FHIRFormatError, FileNotFoundException, IOException {
long ms = System.currentTimeMillis();
System.out.print("Loading "+f.getName()+".. "); System.out.print("Loading "+f.getName()+".. ");
IParser parser = f.getName().endsWith(".json") ? new JsonParser() : new XmlParser(); IParser parser = f.getName().endsWith(".json") ? new JsonParser() : new XmlParser();
Resource res = parser.parse(new FileInputStream(f)); Resource res = parser.parse(new FileInputStream(f));
System.out.println("Done. Size = "+size); System.out.println(" done: ("+Long.toString(System.currentTimeMillis()-ms)+" ms)");
if (res instanceof Bundle) { if (res instanceof Bundle) {
Bundle bnd = (Bundle) res; Bundle bnd = (Bundle) res;
@ -103,19 +106,20 @@ public class BatchLoader {
be.getRequest().setUrl(be.getResource().getResourceType().toString()+"/"+be.getResource().getId()); be.getRequest().setUrl(be.getResource().getResourceType().toString()+"/"+be.getResource().getId());
} }
System.out.print(f.getName()+" ("+cursor+"/"+bnd.getEntry().size()+"): "); System.out.print(f.getName()+" ("+cursor+"/"+bnd.getEntry().size()+"): ");
long ms = System.currentTimeMillis(); ms = System.currentTimeMillis();
Bundle resp = client.transaction(bt); Bundle resp = client.transaction(bt);
cursor = cursor+size; int ncursor = cursor+size;
for (int i = 0; i < resp.getEntry().size(); i++) { for (int i = 0; i < resp.getEntry().size(); i++) {
BundleEntryComponent t = resp.getEntry().get(i); BundleEntryComponent t = resp.getEntry().get(i);
if (!t.getResponse().getStatus().startsWith("2")) { if (!t.getResponse().getStatus().startsWith("2")) {
System.out.println("failed status at "+Integer.toString(i)+": "+t.getResponse().getStatus()); System.out.println("failed status at "+Integer.toString(i)+": "+t.getResponse().getStatus());
cursor = cursor+i-1; ncursor = cursor+i-1;
break; break;
} }
} }
System.out.println(" .. done: ("+Long.toString(System.currentTimeMillis()-ms)+" ms)"); cursor = ncursor;
System.out.println(" .. done: ("+Long.toString(System.currentTimeMillis()-ms)+" ms) "+SimpleDateFormat.getInstance().format(new Date()));
ini.setIntegerProperty("progress", f.getName(), cursor, null); ini.setIntegerProperty("progress", f.getName(), cursor, null);
ini.save(); ini.save();
} }