en:site:recherche:logiciels:sparqlwithspark:watdivs1
Differences
This shows you the differences between two versions of the page.
Both sides previous revision / Previous revision / Next revision | Previous revision | ||
en:site:recherche:logiciels:sparqlwithspark:watdivs1 [15/09/2016 09:51] – hubert | en:site:recherche:logiciels:sparqlwithspark:watdivs1 [16/09/2016 23:06] (current) – [WatDiv Query S1 plans] hubert | ||
---|---|---|---|
Line 1: | Line 1: | ||
- | ====== WatDiv Query S1 ====== | + | {{indexmenu_n> |
+ | |||
+ | ====== WatDiv Query S1 plans ====== | ||
+ | |||
+ | === SPARQL DF plan === | ||
+ | |||
+ | <code scala> | ||
+ | // random partitioning | ||
+ | val DATA = dfDefault | ||
+ | |||
+ | val t1 = DATA.where(s" | ||
+ | val e1 = sc.parallelize(1 to NB_FRAGMENTS, | ||
+ | val t1OK = t1.unionAll(e1) | ||
+ | var plan = t1OK | ||
+ | |||
+ | |||
+ | // ordered by increasing triple tp size | ||
+ | val orderedProp = List( | ||
+ | (" | ||
+ | (" | ||
+ | (" | ||
+ | (" | ||
+ | (" | ||
+ | (" | ||
+ | (" | ||
+ | (" | ||
+ | |||
+ | val triples = orderedProp.map{case(ns, | ||
+ | val idP = getIdP(ns, p) | ||
+ | DATA.where(s" | ||
+ | }} | ||
+ | |||
+ | // next triples | ||
+ | for( i <- triples) { | ||
+ | plan = plan.join(i, | ||
+ | } | ||
+ | |||
+ | |||
+ | // Execute query plan for S1 | ||
+ | // | ||
+ | queryTimeDFIter(plan, | ||
+ | // TIME=18.6s | ||
+ | </ | ||
+ | |||
+ | === SPARQL Hybrid DF plan === | ||
+ | |||
+ | <code scala> | ||
+ | |||
+ | val subset = df.where(s" | ||
+ | subset.count | ||
+ | // Merging time=4,885s | ||
+ | |||
+ | val DATA = subset | ||
+ | |||
+ | val t1 = DATA.where(s" | ||
+ | val e1 = sc.parallelize(1 to NB_FRAGMENTS, | ||
+ | val t1OK = t1.unionAll(e1) | ||
+ | var plan = t1OK | ||
+ | |||
+ | |||
+ | // ordered by increasing triple tp size | ||
+ | val orderedProp = List( | ||
+ | (" | ||
+ | (" | ||
+ | (" | ||
+ | (" | ||
+ | (" | ||
+ | (" | ||
+ | (" | ||
+ | (" | ||
+ | |||
+ | val triples = orderedProp.map{case(ns, | ||
+ | val idP = getIdP(ns, p) | ||
+ | DATA.where(s" | ||
+ | }} | ||
+ | |||
+ | // next triples | ||
+ | for( i <- triples) { | ||
+ | plan = plan.join(i, | ||
+ | } | ||
+ | |||
+ | |||
+ | // Execute query plan for S1 | ||
+ | // | ||
+ | queryTimeDFIter(plan, | ||
+ | // 2,87 + 4,885 = 7,76s | ||
+ | </ | ||
+ | |||
=== S2RDF plan === | === S2RDF plan === | ||
- | < | + | < |
val VP2EXP=VP2Random | val VP2EXP=VP2Random | ||
Line 37: | Line 125: | ||
=== S2RDF+Hybrid plan === | === S2RDF+Hybrid plan === | ||
- | < | + | < |
// VP's partitioned by subject | // VP's partitioned by subject | ||
val VP2EXP=VP2Subject | val VP2EXP=VP2Subject |
en/site/recherche/logiciels/sparqlwithspark/watdivs1.1473925890.txt.gz · Last modified: by hubert