1 /*******************************************************************************
2 * Copyright (c) 2012, 2017 Association for Decentralized Information Management
4 * All rights reserved. This program and the accompanying materials
5 * are made available under the terms of the Eclipse Public License v1.0
6 * which accompanies this distribution, and is available at
7 * http://www.eclipse.org/legal/epl-v10.html
10 * VTT Technical Research Centre of Finland - initial API and implementation
11 * Semantum Oy - e.g. #7016
12 *******************************************************************************/
13 package org.simantics.graph.db;
15 import java.io.DataInput;
16 import java.io.IOException;
17 import java.io.InputStream;
18 import java.util.ArrayList;
19 import java.util.Collections;
20 import java.util.HashMap;
21 import java.util.HashSet;
24 import java.util.TreeMap;
26 import org.simantics.databoard.Bindings;
27 import org.simantics.databoard.adapter.AdaptException;
28 import org.simantics.databoard.binding.Binding;
29 import org.simantics.databoard.binding.mutable.Variant;
30 import org.simantics.databoard.serialization.Serializer;
31 import org.simantics.databoard.type.Datatype;
32 import org.simantics.databoard.util.URIStringUtils;
33 import org.simantics.db.ReadGraph;
34 import org.simantics.db.Resource;
35 import org.simantics.db.Session;
36 import org.simantics.db.VirtualGraph;
37 import org.simantics.db.WriteOnlyGraph;
38 import org.simantics.db.common.WriteBindings;
39 import org.simantics.db.common.procedure.adapter.TransientCacheAsyncListener;
40 import org.simantics.db.common.request.PossibleIndexRoot;
41 import org.simantics.db.common.uri.UnescapedChildMapOfResource;
42 import org.simantics.db.common.utils.Logger;
43 import org.simantics.db.exception.DatabaseException;
44 import org.simantics.db.service.ClusterBuilder2;
45 import org.simantics.db.service.ClusterBuilderFactory;
46 import org.simantics.db.service.ClusteringSupport;
47 import org.simantics.db.service.SerialisationSupport;
48 import org.simantics.db.service.XSupport;
49 import org.simantics.graph.db.TransferableGraphSource.TransferableGraphSourceProcedure;
50 import org.simantics.graph.db.TransferableGraphSource.TransferableGraphSourceValueProcedure;
51 import org.simantics.graph.representation.Extensions;
52 import org.simantics.graph.representation.External;
53 import org.simantics.graph.representation.Identity;
54 import org.simantics.graph.representation.IdentityDefinition;
55 import org.simantics.graph.representation.Internal;
56 import org.simantics.graph.representation.Optional;
57 import org.simantics.graph.representation.Root;
58 import org.simantics.graph.representation.TransferableGraphUtils;
59 import org.simantics.graph.utils.TGResourceUtil;
60 import org.simantics.graph.utils.TGResourceUtil.LongAdapter;
61 import org.simantics.utils.datastructures.Pair;
62 import org.slf4j.LoggerFactory;
64 import gnu.trove.map.TIntObjectMap;
65 import gnu.trove.map.hash.TIntObjectHashMap;
67 public class StreamingTransferableGraphImportProcess implements TransferableGraphImporter {
// SLF4J logger of this class; write() uses it to report failures while appending value bytes.
69 private static final org.slf4j.Logger LOGGER = LoggerFactory.getLogger(StreamingTransferableGraphImportProcess.class);
// Source supplying the identities, statements, values and extensions that are imported.
72 TransferableGraphSource tg;
// Advisor consulted for the import target and for analysing/creating roots and children.
74 IImportAdvisor2 advisor;
// Progress listener; updatePercentage() reports nothing when this is null.
75 TGStatusMonitor monitor;
// Builder used for creating resources, statements and values; assigned in write().
76 ClusterBuilder2 builder;
// Helper queried by needTranslation() to tell whether a datatype may contain resources.
77 final TGResourceUtil resourceUtil = new TGResourceUtil();
// Every missing external URI, mapped to its index in the handles array (see addMissing()).
81 Map<String,Integer> allMissingExternals = new HashMap<>();
// Missing external URIs, reduced by addMissing() so that no entry is a path ancestor of another.
82 Set<String> missingExternals = new HashSet<>();
// URI -> resource for parents that prepare() found or createMissing() created.
83 Map<String,Resource> resolvedParents = new HashMap<>();
// Internal identities (keyed by transferable-graph resource index) whose URI already exists in the database.
84 TIntObjectHashMap<Resource> existingInternalMap = new TIntObjectHashMap<>();
// Identity table filled by readIdentities().
87 Identity[] identities;
// Extensions of the source, keyed by name (getClustering()/getClusterSets() read from it).
88 TreeMap<String, Variant> extensions;
// Built-in resource looked up by findBuiltins() as LAYER0 + "ExternalEntity".
93 Resource ExternalEntity;
/**
 * Creates an import process that does not report progress.
 * <p>
 * Equivalent to calling the five-argument constructor with a {@code null} status monitor.
 *
 * @param session database session, passed on unchanged
 * @param vg      virtual graph, passed on unchanged
 * @param tg      source of the transferable graph to import
 * @param advisor import advisor
 */
public StreamingTransferableGraphImportProcess(
        Session session,
        VirtualGraph vg,
        TransferableGraphSource tg,
        IImportAdvisor2 advisor) {
    this(session, vg, tg, advisor, null);
}
/**
 * Creates an import process that optionally reports progress.
 *
 * @param session database session
 * @param vg      virtual graph; passed to the cluster builder factory in prepare() and write()
 * @param tg      source of the transferable graph to import
 * @param advisor import advisor, stored in {@code this.advisor}
 * @param monitor progress listener, stored in {@code this.monitor}; may be {@code null},
 *                in which case updatePercentage() reports nothing
 */
106 public StreamingTransferableGraphImportProcess(Session session, VirtualGraph vg, TransferableGraphSource tg, IImportAdvisor2 advisor, TGStatusMonitor monitor) {
109 this.advisor = advisor;
110 this.monitor = monitor;
113 private int updatePercentage(int percentage, int done, int total) {
114 if (monitor != null && (done & 63) == 0) {
115 int current = 100*done / total;
116 if (current > percentage) {
117 percentage = current;
118 monitor.status(percentage);
124 public void readIdentities(ReadGraph g) throws Exception {
125 extensions = tg.getExtensions();
126 resourceCount = tg.getResourceCount();
127 identities = new Identity[tg.getIdentityCount()];
128 tg.forIdentities(g, new TransferableGraphSourceProcedure<Identity>() {
133 public void execute(Identity value) throws Exception {
134 identities[counter++] = value;
139 public void findBuiltins(WriteOnlyGraph g) throws DatabaseException {
140 RootLibrary = g.getBuiltin("http:/");
141 String = g.getBuiltin(CoreInitialization.LAYER0 + "String");
142 Library = g.getBuiltin(CoreInitialization.LAYER0 + "Library");
143 InstanceOf = g.getBuiltin(CoreInitialization.LAYER0 + "InstanceOf");
144 ConsistsOf = g.getBuiltin(CoreInitialization.LAYER0 + "ConsistsOf");
145 PartOf = g.getBuiltin(CoreInitialization.LAYER0 + "PartOf");
146 HasName = g.getBuiltin(CoreInitialization.LAYER0 + "HasName");
147 NameOf = g.getBuiltin(CoreInitialization.LAYER0 + "NameOf");
148 ExternalEntity = g.getBuiltin(CoreInitialization.LAYER0 + "ExternalEntity");
151 public void findBuiltins(ReadGraph g) throws DatabaseException {
152 RootLibrary = g.getBuiltin("http:/");
153 String = g.getBuiltin(CoreInitialization.LAYER0 + "String");
154 Library = g.getBuiltin(CoreInitialization.LAYER0 + "Library");
155 InstanceOf = g.getBuiltin(CoreInitialization.LAYER0 + "InstanceOf");
156 ConsistsOf = g.getBuiltin(CoreInitialization.LAYER0 + "ConsistsOf");
157 PartOf = g.getBuiltin(CoreInitialization.LAYER0 + "PartOf");
158 HasName = g.getBuiltin(CoreInitialization.LAYER0 + "HasName");
159 NameOf = g.getBuiltin(CoreInitialization.LAYER0 + "NameOf");
160 ExternalEntity = g.getBuiltin(CoreInitialization.LAYER0 + "ExternalEntity");
163 void addMissing(int handleIndex, String external) {
164 allMissingExternals.put(external, handleIndex);
165 Set<String> removals = new HashSet<>();
166 for(String ext : missingExternals) if(ext.startsWith(external + "/")) return;
167 for(String ext : missingExternals) if(external.startsWith(ext + "/")) removals.add(ext);
168 missingExternals.removeAll(removals);
169 missingExternals.add(external);
172 void prepare(ReadGraph graph) throws Exception {
174 Resource target = advisor.getTarget();
176 indexRoot = graph.syncRequest(new PossibleIndexRoot(target));
179 readIdentities(graph);
181 // System.err.println("ext: " + extensions);
182 // System.err.println("rc: " + resourceCount);
183 // System.err.println("ic: " + identities.length);
185 ClusterBuilderFactory factory = graph.getService(ClusterBuilderFactory.class);
186 ClusterBuilder2 builder = factory.create(vg, false);
188 this.handles = new int[resourceCount];
189 TIntObjectMap<Identity> identityMap = TransferableGraphUtils.mapIdentities(identities);
191 for(Identity identity : identities) {
192 IdentityDefinition definition = identity.definition;
193 if(definition instanceof External) {
194 External def = (External)definition;
195 if(def.parent == -1) {
196 handles[identity.resource] = builder.handle(RootLibrary);
198 if("@inverse".equals(def.name)) {
199 int parent = handles[def.parent];
200 int child = builder.handle(graph.getInverse(builder.resource(parent)));
201 handles[identity.resource] = child;
203 int handle = handles[def.parent];
204 Resource parent = handle != 0 ? builder.resource(handle) : null;
205 // TODO: escape should be removed when names become well-behaving
207 resolvedParents.put(graph.getURI(parent), parent);
208 Map<String,Resource> childMap = graph
209 .syncRequest(new UnescapedChildMapOfResource(parent),
210 TransientCacheAsyncListener.instance());
211 Resource child = childMap.get(def.name);
213 addMissing(identity.resource, graph.getURI(parent) + "/" + URIStringUtils.escape(def.name));
215 handles[identity.resource] = builder.handle(child);
218 addMissing(identity.resource, TransferableGraphUtils.getURI(resourceCount, identityMap, def.parent) + "/" + URIStringUtils.escape(def.name));
223 else if(definition instanceof Internal) {
224 String uri = TransferableGraphUtils.getURI(resourceCount, identityMap, identity.resource);
225 Resource existing = graph.getPossibleResource(uri);
226 if(existing != null) {
227 existingInternalMap.put(identity.resource, existing);
230 else if(definition instanceof Root) {
231 Root root = (Root)definition;
232 if(root.name.equals(""))
233 handles[identity.resource] = builder.handle(RootLibrary);
235 Resource existing = advisor.analyzeRoot(graph, root);
237 handles[identity.resource] = builder.handle(existing);
240 else if(definition instanceof Optional) {
241 External def = (External)definition;
242 Resource parent = builder.resource(handles[def.parent]);
244 handles[identity.resource] = builder.handle(graph.syncRequest(new UnescapedChildMapOfResource(parent)).get(def.name));
248 //if(!missingExternals.isEmpty()) throw new MissingDependencyException(this);
/**
 * Gives a child resource its name, allocating the child first when none is supplied.
 * <p>
 * A new name resource is created, typed as the built-in {@code String}, given the value
 * {@code name} and attached to the child with {@code HasName}/{@code NameOf}.
 *
 * @param graph  graph the statements are written to
 * @param parent parent resource of the child
 * @param child  resource to name, or {@code null} to have a new resource allocated
 * @param name   name stored as the value of the name resource
 * @throws DatabaseException if writing to the graph fails
 */
253 public Resource createChild(WriteOnlyGraph graph, Resource parent, Resource child, String name) throws DatabaseException {
// Allocate the child only when the caller did not provide one.
254 if(child == null) child = graph.newResource();
255 Resource nameResource = graph.newResource();
256 graph.claim(nameResource, InstanceOf, null, String);
257 graph.claimValue(nameResource, name, WriteBindings.STRING);
258 graph.claim(child, HasName, NameOf, nameResource);
262 int[] getClustering() {
263 Variant v = extensions.get(Extensions.CLUSTERING);
264 if(v == null) return null;
266 return (int[])v.getValue(Bindings.INT_ARRAY);
267 } catch (AdaptException e) {
268 Logger.defaultLogError(e);
273 int[] getClusterSets() {
274 Variant v = extensions.get(Extensions.CLUSTER_SETS);
275 if(v == null) return null;
277 return (int[])v.getValue(Bindings.INT_ARRAY);
278 } catch (AdaptException e) {
279 Logger.defaultLogError(e);
284 boolean needTranslation(Datatype type) {
285 return resourceUtil.mayHaveResource(type);
/**
 * Makes sure the transferable-graph resource {@code id}, which is referenced as a cluster
 * set, has a database handle, creating the resource when {@code handles[id]} is still 0.
 * <p>
 * The cluster set that contains {@code id} is resolved first: the root library, the index
 * root, or another transferable-graph resource, in which case this method recurses.
 * The new resource is then created into that set and registered as a cluster set.
 *
 * @param graph       graph providing the {@code ClusteringSupport} service
 * @param rootLibrary root library resource
 * @param clustering  number of resources per cluster entry
 * @param clusterSets cluster set id per cluster entry, parallel to {@code clustering}
 * @param clusters    database cluster per cluster entry; filled in for the entry in which
 *                    the resource is created
 * @param id          transferable-graph index of the cluster set resource, or one of the
 *                    {@code Extensions} cluster set constants
 * @throws DatabaseException if the index root cluster set is requested but no index root
 *                           is known, or if a database operation fails
 */
288 void findClusterSet(WriteOnlyGraph graph, Resource rootLibrary, int[] clustering, int[] clusterSets, long[] clusters, int id) throws DatabaseException {
289 ClusteringSupport support = graph.getService(ClusteringSupport.class);
// The two predefined cluster sets never need to be created.
290 if(id == Extensions.ROOT_LIBRARY_CLUSTER_SET || id == Extensions.INDEX_ROOT_CLUSTER_SET) return;
// Use the index root as the "index root cluster set" only when it really is a cluster set;
// otherwise the root library takes that role.
291 Resource indexRootClusterSetResource = rootLibrary;
292 if(indexRoot != null && support.isClusterSet(indexRoot)) {
293 indexRootClusterSetResource = indexRoot;
295 graph.setClusterSet4NewResource(rootLibrary);
296 graph.flushCluster();
298 int indexRootCsHandle = builder.handle(indexRootClusterSetResource);
// pos accumulates the resource counts of the cluster entries seen so far.
// NOTE(review): presumably used to locate the entry that contains id - confirm.
299 for(int pos=0,index=0;index<clustering.length;index++) {
300 pos += clustering[index];
302 int cs = clusterSets[index];
// Only resources without a handle are created.
303 if(handles[id] == 0) {
305 if(cs == Extensions.ROOT_LIBRARY_CLUSTER_SET) csHandle = builder.handle(rootLibrary);
306 else if(cs == Extensions.INDEX_ROOT_CLUSTER_SET) {
307 if(indexRoot == null) throw new DatabaseException("No index root was available in TG import.");
308 csHandle = indexRootCsHandle;
// The containing cluster set is itself a transferable-graph resource: resolve it first.
311 findClusterSet(graph, rootLibrary, clustering, clusterSets, clusters, cs);
312 csHandle = handles[cs];
// A non-zero entry in clusters is a database cluster recorded earlier for this entry.
315 if(clusters[index] != 0)
316 builder.selectCluster(clusters[index]);
318 builder.newCluster(csHandle);
// Create the resource, remember the cluster it landed in and register it as a cluster set.
320 handles[id] = builder.newResource(csHandle);
321 clusters[index] = support.getCluster(builder.resource(handles[id]));
323 builder.createClusterSet(handles[id]);
/**
 * Creates a placeholder resource for every external URI recorded in
 * {@code allMissingExternals}.
 * <p>
 * The URIs are processed in sorted order, which places a URI before any URI it is a path
 * prefix of. Each placeholder is typed as {@code ExternalEntity}, named with the unescaped
 * last URI segment, attached to its parent with {@code ConsistsOf}/{@code PartOf},
 * remembered in {@code resolvedParents} and stored in {@code handles}.
 * The service mode of {@code XSupport} is switched to {@code (true, false)} for the
 * duration of the work and set back to its previous value afterwards.
 *
 * @param graph graph the placeholders are written to
 * @throws Exception if a database operation fails
 * @throws IllegalStateException with the message "!!"; see the review note at the throw
 */
330 void createMissing(final WriteOnlyGraph graph) throws Exception {
332 if(allMissingExternals.isEmpty()) return;
334 XSupport xs = graph.getService(XSupport.class);
// Remember the current service mode so that it can be restored at the end.
335 Pair<Boolean,Boolean> serviceMode = xs.getServiceMode();
336 xs.setServiceMode(true, false);
338 ArrayList<String> missing = new ArrayList<>(allMissingExternals.keySet());
// Sorting puts a URI ahead of the URIs that extend it, so a placeholder created here
// is in resolvedParents before its own children are processed.
339 Collections.sort(missing);
340 for(String uri : missing) {
// parts[0] is used as the parent URI and parts[1] as the escaped child name below.
341 String[] parts = URIStringUtils.splitURI(uri);
342 // URIStringUtils.splitURI returns root URI in non-standard format, so fix it manually as a workaround
343 if (parts[0].equals("http://")) {
347 Resource parent = resolvedParents.get(parts[0]);
348 // TODO: proper exception message
// NOTE(review): "!!" says nothing about the failing URI - the message should name uri and parts[0].
350 throw new IllegalStateException("!!");
353 Resource childResource = graph.newResource();
354 graph.claim(childResource, InstanceOf, null, ExternalEntity);
356 Resource nameResource = graph.newResource();
357 graph.claim(nameResource, InstanceOf, null, String);
358 graph.claimValue(nameResource, URIStringUtils.unescape(parts[1]), WriteBindings.STRING);
359 graph.claim(childResource, HasName, NameOf, nameResource);
361 graph.claim(parent, ConsistsOf, PartOf, childResource);
// The placeholder can now act as the parent of deeper missing URIs.
363 resolvedParents.put(uri, childResource);
365 handles[allMissingExternals.get(uri)] = builder.handle(childResource);
// NOTE(review): confirm this restore also runs when the loop above throws (try/finally).
368 xs.setServiceMode(serviceMode.first, serviceMode.second);
/**
 * Writes the transferable graph into the database.
 * <p>
 * The steps, in order: create the cluster builder, create placeholders for missing
 * externals, allocate a resource for every handle that is still 0 (following the
 * clustering and cluster set extensions when they are present), let the advisor create
 * internal, root and optional identities, write all statements, write all values, and
 * finally deny the {@code ExternalEntity} type of resources that matched internal
 * identities.
 * Progress is reported through {@code updatePercentage}: statements are counted against
 * {@code statementCount*2} and values against {@code valueCount*2}.
 *
 * @param graph graph the import is written to
 * @throws Exception if the source or the database fails
 */
372 void write(final WriteOnlyGraph graph) throws Exception {
374 final SerialisationSupport ss = graph.getService(SerialisationSupport.class);
376 ClusterBuilderFactory factory = graph.getService(ClusterBuilderFactory.class);
// The advisor decides whether immutable resources may be modified by the builder.
377 if(advisor instanceof IImportAdvisor2) {
378 boolean allowImmutable = ((IImportAdvisor2)advisor).allowImmutableModifications();
379 builder = factory.create(vg, allowImmutable);
381 builder = factory.create(vg, false);
384 createMissing(graph);
// Local alias so that the anonymous and local classes below can capture the array.
386 final int[] handles = this.handles;
388 int[] clustering = getClustering();
389 if(clustering != null) {
391 int[] clusterSets = getClusterSets();
392 if(clusterSets != null) {
394 assert(clustering.length == clusterSets.length);
// Database cluster per clustering entry; 0 until findClusterSet() records one.
396 long[] clusters = new long[clustering.length];
// First make sure every referenced cluster set resource exists.
399 for(int i=0;i<clusterSets.length;i++) {
400 findClusterSet(graph, graph.getRootLibrary(), clustering, clusterSets, clusters, clusterSets[i]);
403 // Then create all resources
// c is the number of resources of entry j, s the cluster set they belong to.
405 for(int j=0;j<clustering.length;j++) {
406 int c = clustering[j];
407 int s = clusterSets[j];
409 if(s == Extensions.ROOT_LIBRARY_CLUSTER_SET)
410 setHandle = builder.handle(graph.getRootLibrary());
411 else if(s == Extensions.INDEX_ROOT_CLUSTER_SET) {
412 if(indexRoot == null) throw new DatabaseException("No index root was available in TG import.");
413 setHandle = builder.handle(indexRoot);
415 else setHandle = handles[s];
416 // Preserve clustering only for internal resources
// NOTE(review): presumably selectCluster is used when clusters[j] was recorded and
// newCluster otherwise - confirm.
418 builder.selectCluster(clusters[j]);
420 builder.newCluster(setHandle);
// Allocate the next c resources, skipping handles that are already resolved.
421 for(int r=0;r<c;r++, i++)
422 if(handles[i] == 0) handles[i] = builder.newResource();
// Resources beyond the clustering information.
425 for(;i<handles.length;++i)
426 if(handles[i] == 0) handles[i] = builder.newResource();
// Clustering without cluster sets: one new cluster per clustering entry.
431 for(int c : clustering) {
432 builder.newCluster();
433 for(int r=0;r<c;r++, i++)
434 if(handles[i] == 0) handles[i] = builder.newResource();
437 for(;i<handles.length;++i)
438 if(handles[i] == 0) handles[i] = builder.newResource();
444 // Create blank resources
445 for(int i=0;i<handles.length;++i)
446 if(handles[i] == 0) handles[i] = builder.newResource();
450 // Internal identities
451 for(Identity identity : identities) {
452 IdentityDefinition definition = identity.definition;
453 // if(handles[identity.resource] != 0)
455 if(definition instanceof External) {
456 // Already done everything
458 else if(definition instanceof Internal) {
459 Internal def = (Internal)definition;
// Reuse the database resource that prepare() found for this URI, if any.
461 Resource external = existingInternalMap.get(identity.resource);
462 if(external != null) {
463 handles[identity.resource] = builder.handle(external);
// Otherwise the advisor creates the child, on top of the allocated resource when there is one.
465 if(handles[identity.resource] != 0)
466 handles[identity.resource] = builder.handle(advisor.createChild(graph, this, builder.resource(handles[def.parent]), builder.resource(handles[identity.resource]), def.name));
468 handles[identity.resource] = builder.handle(advisor.createChild(graph, this, builder.resource(handles[def.parent]), null, def.name));
472 else if(definition instanceof Root) {
474 Root root = (Root)definition;
// The advisor creates the root, on top of the allocated resource when there is one.
475 if(handles[identity.resource] != 0)
476 handles[identity.resource] = builder.handle(advisor.createRoot(graph, root, builder.resource(handles[identity.resource])));
478 handles[identity.resource] = builder.handle(advisor.createRoot(graph, root, null));
480 else if(definition instanceof Optional) {
481 Optional def = (Optional)definition;
// Optional identities are created like internal children and additionally typed as Library.
482 if(handles[identity.resource] != 0) {
483 Resource child = advisor.createChild(graph, this, builder.resource(handles[def.parent]), builder.resource(handles[identity.resource]), def.name);
484 graph.claim(child, InstanceOf, null, Library); // ???
485 handles[identity.resource] = builder.handle(child);
487 Resource child = advisor.createChild(graph, this, builder.resource(handles[def.parent]), null, def.name);
488 graph.claim(child, InstanceOf, null, Library); // ???
489 handles[identity.resource] = builder.handle(child);
// Single-element array so that the classes below can update the reported percentage.
495 int[] percentage = { 0 };
497 int statementCount = tg.getStatementCount();
// Statements: every delivered statement is translated from transferable-graph indices to handles.
498 tg.forStatements(null, new TransferableGraphSourceProcedure<int[]>() {
501 public void execute(int[] value) throws Exception {
508 int subject = handles[sub];
509 int predicate = handles[pred];
510 int object = handles[obj];
512 builder.addStatement(graph, subject, predicate, object);
// The inverse statement runs from object to subject.
514 int inverse = handles[inv];
515 builder.addStatement(graph, object, inverse, subject);
518 // Count from 0% -> 50% => total = statementCount*2
519 percentage[0] = updatePercentage(percentage[0], done[0]++, statementCount*2);
525 int valueCount = tg.getValueCount();
// Receives the values of the source. It is also an InputStream whose read() copies each
// byte it reads from the current value stream into the builder.
528 class ValueProcedure extends InputStream implements TransferableGraphSourceValueProcedure {
530 private TGResourceUtil util = new TGResourceUtil();
// Stream that read() takes its bytes from.
531 private DataInput source;
534 public void execute(int _resource, Datatype type, DataInput stream) throws Exception {
538 //int file = _resource & 0x80000000;
// Clear the highest bit to obtain the resource index.
539 int resource = _resource & 0x7FFFFFFF;
541 Binding binding = Bindings.getBinding(type);
542 Serializer s = Bindings.getSerializer(binding);
544 builder.beginValue(handles[resource]);
// Values that may contain resources are deserialized, have their resource references
// replaced by database ids, and are serialized again.
545 if(util.mayHaveResource(type)) {
546 Object value = s.deserialize(stream);
547 util.adaptValue( binding, value, new LongAdapter() {
549 public long adapt(long in) {
// The incoming value is a transferable-graph resource index.
551 return ss.getRandomAccessId(handles[(int)in]);
552 } catch (DatabaseException e) {
553 throw new IllegalStateException(e);
557 byte[] bytes = s.serialize(value);
558 for(byte b : bytes) {
// Map negative values into the range 0..255 before appending.
560 if(val < 0) val += 256;
561 builder.appendValue(val);
// Reads one unsigned byte from the current value stream and appends it to the builder.
572 public int read() throws IOException {
573 int value = source.readUnsignedByte();
575 builder.appendValue(value);
// NOTE(review): a failed append is only logged here - confirm that continuing is intended.
576 } catch (DatabaseException e) {
577 LOGGER.error("Failed to write value into database", e);
// Copies length bytes of the input into the value of the given resource without decoding them.
583 public void rawCopy(int resource, int length, DataInput input) throws Exception {
584 builder.beginValue(handles[resource]);
585 for (int i = 0; i < length; ++i)
586 builder.appendValue(input.readUnsignedByte());
591 private void work() {
592 // Count from 50% -> 100% => [valueCount, valueCount*2)
593 percentage[0] = updatePercentage(percentage[0], valueCount + done[0]++, valueCount*2);
597 tg.forValues2(null, new ValueProcedure());
// Resources matched to internal identities get their ExternalEntity type denied.
599 for(Resource r : existingInternalMap.valueCollection()) {
600 graph.deny(r, InstanceOf, null, ExternalEntity, null);
/**
 * Translates every handle into a random access id.
 *
 * @param serializer serialisation support used for the translation
 * @throws DatabaseException if a handle cannot be translated
 */
606 public long[] getResourceIds(SerialisationSupport serializer) throws DatabaseException {
607 final int count = handles.length;
// One id per handle, in handle order.
608 long[] resourceIds = new long[count];
609 for(int i=0;i<count;++i)
610 resourceIds[i] = serializer.getRandomAccessId(handles[i]);